markupr 2.1.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/commands/review-feedback.md +47 -0
- package/.eslintrc.json +35 -0
- package/.github/CODEOWNERS +16 -0
- package/.github/FUNDING.yml +1 -0
- package/.github/ISSUE_TEMPLATE/bug_report.md +56 -0
- package/.github/ISSUE_TEMPLATE/feature_request.md +54 -0
- package/.github/PULL_REQUEST_TEMPLATE.md +89 -0
- package/.github/dependabot.yml +70 -0
- package/.github/workflows/ci.yml +184 -0
- package/.github/workflows/deploy-landing.yml +134 -0
- package/.github/workflows/nightly.yml +288 -0
- package/.github/workflows/release.yml +318 -0
- package/CHANGELOG.md +127 -0
- package/CLAUDE.md +137 -0
- package/CODE_OF_CONDUCT.md +9 -0
- package/CONTRIBUTING.md +390 -0
- package/LICENSE +21 -0
- package/PRODUCT_VISION.md +277 -0
- package/README.md +517 -0
- package/SECURITY.md +51 -0
- package/SIGNING_INSTRUCTIONS.md +284 -0
- package/assets/DMG_BACKGROUND_INSTRUCTIONS.md +130 -0
- package/assets/svg-source/dmg-background.svg +70 -0
- package/assets/svg-source/icon.svg +20 -0
- package/assets/svg-source/tray-icon-processing.svg +7 -0
- package/assets/svg-source/tray-icon-recording.svg +7 -0
- package/assets/svg-source/tray-icon.svg +6 -0
- package/assets/tray-complete.png +0 -0
- package/assets/tray-complete@2x.png +0 -0
- package/assets/tray-completeTemplate.png +0 -0
- package/assets/tray-completeTemplate@2x.png +0 -0
- package/assets/tray-error.png +0 -0
- package/assets/tray-error@2x.png +0 -0
- package/assets/tray-errorTemplate.png +0 -0
- package/assets/tray-errorTemplate@2x.png +0 -0
- package/assets/tray-icon-processing.png +0 -0
- package/assets/tray-icon-processing@2x.png +0 -0
- package/assets/tray-icon-processingTemplate.png +0 -0
- package/assets/tray-icon-processingTemplate@2x.png +0 -0
- package/assets/tray-icon-recording.png +0 -0
- package/assets/tray-icon-recording@2x.png +0 -0
- package/assets/tray-icon-recordingTemplate.png +0 -0
- package/assets/tray-icon-recordingTemplate@2x.png +0 -0
- package/assets/tray-icon.png +0 -0
- package/assets/tray-icon@2x.png +0 -0
- package/assets/tray-iconTemplate.png +0 -0
- package/assets/tray-iconTemplate@2x.png +0 -0
- package/assets/tray-idle.png +0 -0
- package/assets/tray-idle@2x.png +0 -0
- package/assets/tray-idleTemplate.png +0 -0
- package/assets/tray-idleTemplate@2x.png +0 -0
- package/assets/tray-processing-0.png +0 -0
- package/assets/tray-processing-0@2x.png +0 -0
- package/assets/tray-processing-0Template.png +0 -0
- package/assets/tray-processing-0Template@2x.png +0 -0
- package/assets/tray-processing-1.png +0 -0
- package/assets/tray-processing-1@2x.png +0 -0
- package/assets/tray-processing-1Template.png +0 -0
- package/assets/tray-processing-1Template@2x.png +0 -0
- package/assets/tray-processing-2.png +0 -0
- package/assets/tray-processing-2@2x.png +0 -0
- package/assets/tray-processing-2Template.png +0 -0
- package/assets/tray-processing-2Template@2x.png +0 -0
- package/assets/tray-processing-3.png +0 -0
- package/assets/tray-processing-3@2x.png +0 -0
- package/assets/tray-processing-3Template.png +0 -0
- package/assets/tray-processing-3Template@2x.png +0 -0
- package/assets/tray-processing.png +0 -0
- package/assets/tray-processing@2x.png +0 -0
- package/assets/tray-processingTemplate.png +0 -0
- package/assets/tray-processingTemplate@2x.png +0 -0
- package/assets/tray-recording.png +0 -0
- package/assets/tray-recording@2x.png +0 -0
- package/assets/tray-recordingTemplate.png +0 -0
- package/assets/tray-recordingTemplate@2x.png +0 -0
- package/build/DMG_BACKGROUND_SPEC.md +50 -0
- package/build/dmg-background.png +0 -0
- package/build/dmg-background@2x.png +0 -0
- package/build/entitlements.mac.inherit.plist +27 -0
- package/build/entitlements.mac.plist +41 -0
- package/build/favicon-16.png +0 -0
- package/build/favicon-180.png +0 -0
- package/build/favicon-192.png +0 -0
- package/build/favicon-32.png +0 -0
- package/build/favicon-48.png +0 -0
- package/build/favicon-512.png +0 -0
- package/build/favicon-64.png +0 -0
- package/build/icon-128.png +0 -0
- package/build/icon-16.png +0 -0
- package/build/icon-24.png +0 -0
- package/build/icon-256.png +0 -0
- package/build/icon-32.png +0 -0
- package/build/icon-48.png +0 -0
- package/build/icon-64.png +0 -0
- package/build/icon.icns +0 -0
- package/build/icon.ico +0 -0
- package/build/icon.iconset/icon_128x128.png +0 -0
- package/build/icon.iconset/icon_128x128@2x.png +0 -0
- package/build/icon.iconset/icon_16x16.png +0 -0
- package/build/icon.iconset/icon_16x16@2x.png +0 -0
- package/build/icon.iconset/icon_256x256.png +0 -0
- package/build/icon.iconset/icon_256x256@2x.png +0 -0
- package/build/icon.iconset/icon_32x32.png +0 -0
- package/build/icon.iconset/icon_32x32@2x.png +0 -0
- package/build/icon.iconset/icon_512x512.png +0 -0
- package/build/icon.iconset/icon_512x512@2x.png +0 -0
- package/build/icon.png +0 -0
- package/build/installer-header.bmp +0 -0
- package/build/installer-header.png +0 -0
- package/build/installer-sidebar.bmp +0 -0
- package/build/installer-sidebar.png +0 -0
- package/build/installer.nsh +45 -0
- package/build/overlay-processing.png +0 -0
- package/build/overlay-recording.png +0 -0
- package/build/toolbar-record.png +0 -0
- package/build/toolbar-screenshot.png +0 -0
- package/build/toolbar-settings.png +0 -0
- package/build/toolbar-stop.png +0 -0
- package/dist/main/index.mjs +12612 -0
- package/dist/preload/index.mjs +907 -0
- package/dist/renderer/assets/index-CCmUjl9K.js +19495 -0
- package/dist/renderer/assets/index-CUqz_Gs6.css +2270 -0
- package/dist/renderer/index.html +27 -0
- package/docs/AI_AGENT_QUICKSTART.md +42 -0
- package/docs/AI_PIPELINE_DESIGN.md +595 -0
- package/docs/API.md +514 -0
- package/docs/ARCHITECTURE.md +460 -0
- package/docs/CONFIGURATION.md +336 -0
- package/docs/DEVELOPMENT.md +508 -0
- package/docs/EXPORT_FORMATS.md +451 -0
- package/docs/GETTING_STARTED.md +236 -0
- package/docs/KEYBOARD_SHORTCUTS.md +334 -0
- package/docs/TROUBLESHOOTING.md +418 -0
- package/docs/landing/index.html +672 -0
- package/docs/landing/script.js +342 -0
- package/docs/landing/styles.css +1543 -0
- package/electron-builder.yml +140 -0
- package/electron.vite.config.ts +63 -0
- package/package.json +108 -0
- package/railway.json +12 -0
- package/scripts/build.mjs +51 -0
- package/scripts/generate-icons.mjs +314 -0
- package/scripts/generate-installer-images.cjs +253 -0
- package/scripts/generate-tray-icons.mjs +258 -0
- package/scripts/notarize.cjs +180 -0
- package/scripts/one-click-clean-test.sh +147 -0
- package/scripts/postinstall.mjs +36 -0
- package/scripts/setup-markupr.sh +55 -0
- package/setup +17 -0
- package/site/index.html +1835 -0
- package/site/package.json +11 -0
- package/site/railway.json +12 -0
- package/site/server.js +31 -0
- package/src/main/AutoUpdater.ts +392 -0
- package/src/main/CrashRecovery.ts +655 -0
- package/src/main/ErrorHandler.ts +703 -0
- package/src/main/HotkeyManager.ts +399 -0
- package/src/main/MenuManager.ts +529 -0
- package/src/main/PermissionManager.ts +420 -0
- package/src/main/SessionController.ts +1465 -0
- package/src/main/TrayManager.ts +540 -0
- package/src/main/ai/AIPipelineManager.ts +199 -0
- package/src/main/ai/ClaudeAnalyzer.ts +339 -0
- package/src/main/ai/ImageOptimizer.ts +176 -0
- package/src/main/ai/StructuredMarkdownBuilder.ts +379 -0
- package/src/main/ai/index.ts +16 -0
- package/src/main/ai/types.ts +258 -0
- package/src/main/analysis/ClarificationGenerator.ts +385 -0
- package/src/main/analysis/FeedbackAnalyzer.ts +531 -0
- package/src/main/analysis/index.ts +19 -0
- package/src/main/audio/AudioCapture.ts +978 -0
- package/src/main/audio/audioUtils.ts +100 -0
- package/src/main/audio/index.ts +20 -0
- package/src/main/capture/index.ts +1 -0
- package/src/main/index.ts +1693 -0
- package/src/main/ipc/captureHandlers.ts +272 -0
- package/src/main/ipc/index.ts +45 -0
- package/src/main/ipc/outputHandlers.ts +302 -0
- package/src/main/ipc/sessionHandlers.ts +56 -0
- package/src/main/ipc/settingsHandlers.ts +471 -0
- package/src/main/ipc/types.ts +56 -0
- package/src/main/ipc/windowHandlers.ts +277 -0
- package/src/main/output/ClipboardService.ts +369 -0
- package/src/main/output/ExportService.ts +539 -0
- package/src/main/output/FileManager.ts +416 -0
- package/src/main/output/MarkdownGenerator.ts +791 -0
- package/src/main/output/MarkdownPatcher.ts +299 -0
- package/src/main/output/index.ts +186 -0
- package/src/main/output/sessionAdapter.ts +207 -0
- package/src/main/output/templates/html-template.ts +553 -0
- package/src/main/pipeline/FrameExtractor.ts +330 -0
- package/src/main/pipeline/PostProcessor.ts +399 -0
- package/src/main/pipeline/TranscriptAnalyzer.ts +226 -0
- package/src/main/pipeline/index.ts +36 -0
- package/src/main/platform/WindowsTaskbar.ts +600 -0
- package/src/main/platform/index.ts +16 -0
- package/src/main/settings/SettingsManager.ts +730 -0
- package/src/main/settings/index.ts +19 -0
- package/src/main/transcription/ModelDownloadManager.ts +494 -0
- package/src/main/transcription/TierManager.ts +219 -0
- package/src/main/transcription/TranscriptionRecoveryService.ts +340 -0
- package/src/main/transcription/WhisperService.ts +748 -0
- package/src/main/transcription/index.ts +56 -0
- package/src/main/transcription/types.ts +135 -0
- package/src/main/windows/PopoverManager.ts +284 -0
- package/src/main/windows/TaskbarIntegration.ts +452 -0
- package/src/main/windows/index.ts +23 -0
- package/src/preload/index.ts +1047 -0
- package/src/renderer/App.tsx +515 -0
- package/src/renderer/AppWrapper.tsx +28 -0
- package/src/renderer/assets/logo-dark.svg +7 -0
- package/src/renderer/assets/logo.svg +7 -0
- package/src/renderer/audio/AudioCaptureRenderer.ts +454 -0
- package/src/renderer/capture/ScreenRecordingRenderer.ts +492 -0
- package/src/renderer/components/AnnotationOverlay.tsx +836 -0
- package/src/renderer/components/AudioWaveform.tsx +811 -0
- package/src/renderer/components/ClarificationQuestions.tsx +656 -0
- package/src/renderer/components/CountdownTimer.tsx +495 -0
- package/src/renderer/components/CrashRecoveryDialog.tsx +632 -0
- package/src/renderer/components/DonateButton.tsx +127 -0
- package/src/renderer/components/ErrorBoundary.tsx +308 -0
- package/src/renderer/components/ExportDialog.tsx +872 -0
- package/src/renderer/components/HotkeyHint.tsx +261 -0
- package/src/renderer/components/KeyboardShortcuts.tsx +787 -0
- package/src/renderer/components/ModelDownloadDialog.tsx +844 -0
- package/src/renderer/components/Onboarding.tsx +1830 -0
- package/src/renderer/components/ProcessingOverlay.tsx +157 -0
- package/src/renderer/components/RecordingOverlay.tsx +423 -0
- package/src/renderer/components/SessionHistory.tsx +1746 -0
- package/src/renderer/components/SessionReview.tsx +1321 -0
- package/src/renderer/components/SettingsPanel.tsx +217 -0
- package/src/renderer/components/Skeleton.tsx +347 -0
- package/src/renderer/components/StatusIndicator.tsx +86 -0
- package/src/renderer/components/ThemeProvider.tsx +429 -0
- package/src/renderer/components/Tooltip.tsx +370 -0
- package/src/renderer/components/TranscriptionPreview.tsx +183 -0
- package/src/renderer/components/TranscriptionTierSelector.tsx +640 -0
- package/src/renderer/components/UpdateNotification.tsx +377 -0
- package/src/renderer/components/WindowSelector.tsx +947 -0
- package/src/renderer/components/index.ts +99 -0
- package/src/renderer/components/primitives/ApiKeyInput.tsx +98 -0
- package/src/renderer/components/primitives/ColorPicker.tsx +65 -0
- package/src/renderer/components/primitives/DangerButton.tsx +45 -0
- package/src/renderer/components/primitives/DirectoryPicker.tsx +41 -0
- package/src/renderer/components/primitives/Dropdown.tsx +34 -0
- package/src/renderer/components/primitives/KeyRecorder.tsx +117 -0
- package/src/renderer/components/primitives/SettingsSection.tsx +32 -0
- package/src/renderer/components/primitives/Slider.tsx +43 -0
- package/src/renderer/components/primitives/Toggle.tsx +36 -0
- package/src/renderer/components/primitives/index.ts +10 -0
- package/src/renderer/components/settings/AdvancedTab.tsx +174 -0
- package/src/renderer/components/settings/AppearanceTab.tsx +77 -0
- package/src/renderer/components/settings/GeneralTab.tsx +40 -0
- package/src/renderer/components/settings/HotkeysTab.tsx +79 -0
- package/src/renderer/components/settings/RecordingTab.tsx +84 -0
- package/src/renderer/components/settings/index.ts +9 -0
- package/src/renderer/components/settings/settingsStyles.ts +673 -0
- package/src/renderer/components/settings/tabConfig.tsx +85 -0
- package/src/renderer/components/settings/useSettingsPanel.ts +447 -0
- package/src/renderer/contexts/ProcessingContext.tsx +227 -0
- package/src/renderer/contexts/RecordingContext.tsx +683 -0
- package/src/renderer/contexts/UIContext.tsx +326 -0
- package/src/renderer/contexts/index.ts +24 -0
- package/src/renderer/donateMessages.ts +69 -0
- package/src/renderer/hooks/index.ts +75 -0
- package/src/renderer/hooks/useAnimation.tsx +544 -0
- package/src/renderer/hooks/useTheme.ts +313 -0
- package/src/renderer/index.html +26 -0
- package/src/renderer/main.tsx +52 -0
- package/src/renderer/styles/animations.css +1093 -0
- package/src/renderer/styles/app-shell.css +662 -0
- package/src/renderer/styles/globals.css +515 -0
- package/src/renderer/styles/theme.ts +578 -0
- package/src/renderer/types/electron.d.ts +385 -0
- package/src/shared/hotkeys.ts +283 -0
- package/src/shared/types.ts +809 -0
- package/tests/clipboard.test.ts +228 -0
- package/tests/e2e/criticalPaths.test.ts +594 -0
- package/tests/feedbackAnalyzer.test.ts +303 -0
- package/tests/integration/sessionFlow.test.ts +583 -0
- package/tests/markdownGenerator.test.ts +418 -0
- package/tests/output.test.ts +96 -0
- package/tests/setup.ts +486 -0
- package/tests/unit/appIntegration.test.ts +676 -0
- package/tests/unit/appViewState.test.ts +281 -0
- package/tests/unit/audioIpcChannels.test.ts +17 -0
- package/tests/unit/exportService.test.ts +492 -0
- package/tests/unit/hotkeys.test.ts +92 -0
- package/tests/unit/navigationPreload.test.ts +94 -0
- package/tests/unit/onboardingFlow.test.ts +345 -0
- package/tests/unit/permissionManager.test.ts +175 -0
- package/tests/unit/permissionManagerExpanded.test.ts +296 -0
- package/tests/unit/screenRecordingRenderer.test.ts +368 -0
- package/tests/unit/sessionController.test.ts +515 -0
- package/tests/unit/tierManager.test.ts +61 -0
- package/tests/unit/tierManagerExpanded.test.ts +142 -0
- package/tests/unit/transcriptAnalyzer.test.ts +64 -0
- package/tsconfig.json +25 -0
- package/vitest.config.ts +46 -0
|
@@ -0,0 +1,219 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* TierManager.ts - Transcription Tier Selection (Post-Process Architecture)
|
|
3
|
+
*
|
|
4
|
+
* Simplified tier system for post-session transcription:
|
|
5
|
+
* - Tier 1: Local Whisper (default, batch transcription after recording)
|
|
6
|
+
* - Tier 2: Timer-only (fallback, no transcription)
|
|
7
|
+
*
|
|
8
|
+
* In the post-process architecture, transcription no longer happens during
|
|
9
|
+
* recording. TierManager tracks tier availability for the UI and provides
|
|
10
|
+
* tier preference selection for post-session processing.
|
|
11
|
+
*/
|
|
12
|
+
|
|
13
|
+
import { EventEmitter } from 'events';
|
|
14
|
+
import * as os from 'os';
|
|
15
|
+
import { modelDownloadManager } from './ModelDownloadManager';
|
|
16
|
+
import { getSettingsManager } from '../settings';
|
|
17
|
+
import type {
|
|
18
|
+
TranscriptionTier,
|
|
19
|
+
WhisperModel,
|
|
20
|
+
TierStatus,
|
|
21
|
+
TierQuality,
|
|
22
|
+
} from './types';
|
|
23
|
+
|
|
24
|
+
// ============================================================================
|
|
25
|
+
// Constants
|
|
26
|
+
// ============================================================================
|
|
27
|
+
|
|
28
|
+
/** Tiers ordered from most to least preferred; automatic selection walks this list in order. */
const TIER_PRIORITY: TranscriptionTier[] = ['whisper', 'timer-only'];

/** Accuracy and latency labels reported for each tier. */
const TIER_QUALITY: Record<TranscriptionTier, TierQuality> = {
  whisper: { accuracy: '90%+', latency: 'Post-session' },
  'timer-only': { accuracy: 'N/A', latency: 'N/A' },
};

/** Number of bytes in one mebibyte; keeps the memory tables below readable. */
const BYTES_PER_MIB = 1024 ** 2;

/** Free memory required for Whisper (2GB) when a model has no entry in the table below. */
const WHISPER_MIN_MEMORY = 2 * 1024 * BYTES_PER_MIB;

/** Approximate free memory, in bytes, required to run each Whisper model size. */
const MODEL_MEMORY_REQUIREMENT_BYTES: Record<WhisperModel, number> = {
  tiny: 450 * BYTES_PER_MIB,
  base: 800 * BYTES_PER_MIB,
  small: 1400 * BYTES_PER_MIB,
  medium: 2800 * BYTES_PER_MIB,
  large: 5200 * BYTES_PER_MIB,
};

/** Either a concrete tier or 'auto', which defers to the best available tier. */
type PreferredTier = 'auto' | TranscriptionTier;
|
|
47
|
+
|
|
48
|
+
// ============================================================================
|
|
49
|
+
// TierManager Class
|
|
50
|
+
// ============================================================================
|
|
51
|
+
|
|
52
|
+
/**
 * Reports which transcription tiers are usable and stores the user's tier
 * preference for post-session processing.
 *
 * Two tiers exist: `whisper` (local model; requires a downloaded model and
 * enough free memory) and `timer-only` (no transcription; always available).
 */
export class TierManager extends EventEmitter {
  // Never assigned by any method of this class, so getCurrentTier() reports null.
  private currentTier: TranscriptionTier | null = null;
  private preferredTier: PreferredTier = 'auto';

  // ============================================================================
  // Public API
  // ============================================================================

  /**
   * Probe every tier and report its availability.
   *
   * @returns Statuses in the fixed order [whisper, timer-only].
   */
  async getTierStatuses(): Promise<TierStatus[]> {
    const whisperCheck = this.checkWhisperAvailability();
    const timerCheck = this.checkTimerOnlyAvailability();
    return Promise.all([whisperCheck, timerCheck]);
  }

  /**
   * @returns The currently active tier, or null when none has been recorded.
   */
  getCurrentTier(): TranscriptionTier | null {
    return this.currentTier;
  }

  /**
   * @returns The stored preference; 'auto' means "pick the best available tier".
   */
  getPreferredTier(): PreferredTier {
    return this.preferredTier;
  }

  /**
   * Store the tier preference used for post-session transcription.
   *
   * @param tier - 'auto' or a tier that actually transcribes.
   * @throws Error when the tier does not provide transcription (e.g. 'timer-only').
   */
  setPreferredTier(tier: PreferredTier): void {
    const isAcceptable = tier === 'auto' || this.tierProvidesTranscription(tier);
    if (!isAcceptable) {
      throw new Error('This tier does not provide transcription. Select Whisper or Auto.');
    }

    this.preferredTier = tier;
    this.log(`Preferred tier set to: ${tier}`);
  }

  /**
   * @param tier - Tier to look up.
   * @returns The accuracy/latency labels for that tier.
   */
  getTierQuality(tier: TranscriptionTier): TierQuality {
    return TIER_QUALITY[tier];
  }

  /**
   * @param tier - Tier to test.
   * @returns true only for tiers that produce a transcript (currently just 'whisper').
   */
  tierProvidesTranscription(tier: TranscriptionTier): boolean {
    return tier === 'whisper';
  }

  /**
   * Determine whether any transcription path is usable.
   *
   * An available local transcribing tier is sufficient; otherwise a non-blank
   * stored OpenAI API key counts as a valid cloud path.
   *
   * @returns true when at least one path can produce a transcript.
   */
  async hasTranscriptionCapability(): Promise<boolean> {
    const tierStatuses = await this.getTierStatuses();
    for (const status of tierStatuses) {
      if (status.available && this.tierProvidesTranscription(status.tier)) {
        return true;
      }
    }

    // Post-session OpenAI transcription is also a valid capability path.
    try {
      const storedKey = await getSettingsManager().getApiKey('openai');
      return Boolean(storedKey?.trim());
    } catch {
      // Key lookup is best-effort: a failure is reported as "no capability".
      return false;
    }
  }

  /**
   * @returns A shallow copy of the quality table for all tiers.
   */
  getAllTierQualities(): Record<TranscriptionTier, TierQuality> {
    return { ...TIER_QUALITY };
  }

  /**
   * Choose the tier to use.
   *
   * The stored preference wins when it is available; otherwise the first
   * available tier in TIER_PRIORITY order is returned.
   *
   * @returns The selected tier.
   */
  async selectBestTier(): Promise<TranscriptionTier> {
    const statuses = await this.getTierStatuses();
    const isAvailable = (tier: TranscriptionTier): boolean =>
      Boolean(statuses.find((status) => status.tier === tier)?.available);

    const preferred = this.preferredTier;
    if (preferred !== 'auto') {
      if (isAvailable(preferred)) {
        return preferred;
      }

      this.log(`Preferred tier "${preferred}" unavailable, using automatic fallover`);
    }

    // timer-only always reports available, so the literal fallback is only a safety net.
    return TIER_PRIORITY.find(isAvailable) ?? 'timer-only';
  }

  // ============================================================================
  // Tier Availability Checks
  // ============================================================================

  /**
   * Whisper is available when a model is downloaded and free memory covers the
   * default model's requirement (or WHISPER_MIN_MEMORY when the model has no entry).
   */
  private async checkWhisperAvailability(): Promise<TierStatus> {
    const unavailable = (reason: string): TierStatus => ({
      tier: 'whisper',
      available: false,
      reason,
    });

    if (!modelDownloadManager.hasAnyModel()) {
      return unavailable('Model not downloaded');
    }

    const selectedModel = modelDownloadManager.getDefaultModel();
    const requiredBytes = MODEL_MEMORY_REQUIREMENT_BYTES[selectedModel] ?? WHISPER_MIN_MEMORY;
    const freeBytes = os.freemem();

    if (freeBytes < requiredBytes) {
      const toMb = (bytes: number): number => Math.round(bytes / 1024 / 1024);
      return unavailable(
        `Insufficient memory for ${selectedModel} model (${toMb(freeBytes)}MB free, need ~${toMb(requiredBytes)}MB)`
      );
    }

    return { tier: 'whisper', available: true };
  }

  /** Timer-only needs no resources, so it is unconditionally available. */
  private async checkTimerOnlyAvailability(): Promise<TierStatus> {
    return { tier: 'timer-only', available: true };
  }

  // ============================================================================
  // Logging
  // ============================================================================

  /** Write a message to the console with the TierManager prefix. */
  private log(message: string): void {
    console.log(`[TierManager] ${message}`);
  }
}

// ============================================================================
// Singleton Export
// ============================================================================

/** Shared module-level instance. */
export const tierManager = new TierManager();
export default TierManager;
|
|
@@ -0,0 +1,340 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* TranscriptionRecoveryService
|
|
3
|
+
*
|
|
4
|
+
* Handles post-session transcription recovery when live transcription
|
|
5
|
+
* produces no output. Tries OpenAI Whisper-1 API first, then falls back
|
|
6
|
+
* to local Whisper. Extracted from SessionController for separation of concerns.
|
|
7
|
+
*/
|
|
8
|
+
|
|
9
|
+
import type { CapturedAudioAsset } from '../audio/AudioCapture';
|
|
10
|
+
import { extensionFromMimeType } from '../audio/audioUtils';
|
|
11
|
+
import { getSettingsManager } from '../settings';
|
|
12
|
+
import { whisperService } from './WhisperService';
|
|
13
|
+
import type { TranscriptEvent } from './types';
|
|
14
|
+
|
|
15
|
+
// =============================================================================
|
|
16
|
+
// Configuration
|
|
17
|
+
// =============================================================================
|
|
18
|
+
|
|
19
|
+
/** Length, in seconds, of each audio chunk handed to local Whisper during recovery. */
const WHISPER_RECOVERY_CHUNK_SECONDS = 30;

/**
 * Eight minutes, expressed in seconds.
 * NOTE(review): presumably the longest recording for which local Whisper
 * recovery is attempted; the code that reads this constant is outside this
 * section, so confirm against its usage.
 */
const MAX_POST_SESSION_LOCAL_RECOVERY_DURATION_SEC = 60 * 8;
|
|
21
|
+
|
|
22
|
+
// =============================================================================
|
|
23
|
+
// Types
|
|
24
|
+
// =============================================================================
|
|
25
|
+
|
|
26
|
+
/**
 * Captured audio handed to the recovery strategies.
 *
 * The SessionController supplies this from its audio capture service. Either
 * field may be null when that representation of the audio is not available.
 */
export interface RecoveryAudioData {
  /** Encoded recording (webm/ogg/mp4); this is what gets uploaded to the OpenAI API. */
  capturedAudioAsset: CapturedAudioAsset | null;

  /** Raw PCM Float32 sample data; this is what local Whisper transcribes. */
  capturedAudioBuffer: Buffer | null;
}
|
|
36
|
+
|
|
37
|
+
// =============================================================================
|
|
38
|
+
// Pure Helper Functions
|
|
39
|
+
// =============================================================================
|
|
40
|
+
|
|
41
|
+
/**
 * Convert a transcript timestamp into an absolute time on the session's clock.
 *
 * A value is treated as an offset from the start of the session, and rebased
 * onto `sessionStartSec`, when either:
 *  - it is smaller than 86,400 (one day in seconds), or
 *  - it lies more than 60 seconds before the session start.
 * Negative offsets are clamped to zero before rebasing. Any other value is
 * already absolute and is returned unchanged.
 *
 * @param timestamp - Absolute time or session-relative offset, in seconds.
 * @param sessionStartSec - Session start time, in seconds.
 * @returns The timestamp expressed as an absolute time in seconds.
 */
export function normalizeTranscriptTimestamp(timestamp: number, sessionStartSec: number): number {
  const isSessionRelative = timestamp < 86_400 || timestamp < sessionStartSec - 60;
  return isSessionRelative ? sessionStartSec + Math.max(0, timestamp) : timestamp;
}
|
|
54
|
+
|
|
55
|
+
/**
 * Build a short, user-presentable description of a failed OpenAI API response.
 *
 * Resolution order:
 *  1. `HTTP <status>` when the response body cannot be read at all;
 *  2. `'Unknown API error'` when the body is empty or whitespace;
 *  3. the trimmed `error.message` of a JSON error body, when it is a non-blank string;
 *  4. otherwise the raw body text, truncated to 220 characters.
 *
 * Step 4 also applies to bodies that are not JSON (for example an HTML or
 * plain-text error page from an intermediary), so their detail is kept rather
 * than replaced by the status code alone.
 *
 * @param response - The non-OK fetch response; its body is consumed.
 * @returns A non-empty description of the failure. Never rejects.
 */
async function extractOpenAiError(response: Response): Promise<string> {
  let body: string;
  try {
    body = (await response.text()).trim();
  } catch {
    return `HTTP ${response.status}`;
  }

  if (body.length === 0) {
    return 'Unknown API error';
  }

  try {
    const parsed = JSON.parse(body) as { error?: { message?: unknown } } | null;
    const message = parsed?.error?.message;
    if (typeof message === 'string' && message.trim().length > 0) {
      return message.trim();
    }
  } catch {
    // The body is not JSON; fall through and report the raw text instead.
  }

  return body.length > 220 ? `${body.slice(0, 220)}...` : body;
}
|
|
76
|
+
|
|
77
|
+
/**
 * Look up the OpenAI API key through the settings manager.
 *
 * @returns The key with surrounding whitespace removed, or null when no key is
 *          stored, the stored key is blank, or the lookup fails (the failure is
 *          logged as a warning rather than thrown).
 */
async function getOpenAIApiKey(): Promise<string | null> {
  try {
    const storedKey = await getSettingsManager().getApiKey('openai');
    const cleanedKey = storedKey?.trim() ?? '';
    return cleanedKey.length > 0 ? cleanedKey : null;
  } catch (error) {
    console.warn('[TranscriptionRecovery] Failed to read OpenAI API key:', error);
    return null;
  }
}
|
|
91
|
+
|
|
92
|
+
// =============================================================================
|
|
93
|
+
// Recovery Strategies
|
|
94
|
+
// =============================================================================
|
|
95
|
+
|
|
96
|
+
/**
 * Recover a transcript by uploading the encoded session audio to the OpenAI
 * `whisper-1` transcription endpoint.
 *
 * Each attempt is bounded by a timeout of 1.8x the audio duration, clamped to
 * the range 30s..180s. A failed attempt is retried after a linear backoff
 * (500ms * attempt number). HTTP client errors that cannot succeed on a retry
 * (4xx other than 408, 409 and 429 — e.g. an invalid API key) end recovery
 * immediately, so the audio is not uploaded again for no benefit.
 *
 * @param audioAsset - Encoded audio; `buffer`, `mimeType` and `durationMs` are read.
 * @param sessionStartSec - Session start time in seconds, used to place segments in time.
 * @param apiKey - OpenAI API key, sent as a Bearer token.
 * @param maxAttempts - Maximum number of upload attempts.
 * @returns Final transcript events tagged with the 'whisper' tier, or an empty
 *          array when no attempt produced text. Failures are logged, not thrown.
 */
async function recoverWithOpenAI(
  audioAsset: CapturedAudioAsset,
  sessionStartSec: number,
  apiKey: string,
  maxAttempts: number,
): Promise<TranscriptEvent[]> {
  // A missing or non-finite duration would turn the clamp below into NaN, and a
  // NaN timer delay fires almost immediately, aborting the upload before it can finish.
  const durationMs = Number.isFinite(audioAsset.durationMs) ? audioAsset.durationMs : 0;
  const timeoutMs = Math.min(180_000, Math.max(30_000, Math.round(durationMs * 1.8)));

  for (let attempt = 1; attempt <= maxAttempts; attempt++) {
    // Cleared only when the server rejects the request in a way a retry cannot fix.
    let retryable = true;

    try {
      const controller = new AbortController();
      const timeout = setTimeout(() => controller.abort(), timeoutMs);

      const recoveredEvents: TranscriptEvent[] = [];

      try {
        const extension = extensionFromMimeType(audioAsset.mimeType);
        const form = new FormData();
        form.append('model', 'whisper-1');
        form.append('response_format', 'verbose_json');
        form.append('temperature', '0');
        form.append(
          'file',
          new Blob([new Uint8Array(audioAsset.buffer)], { type: audioAsset.mimeType }),
          `session-audio${extension}`,
        );

        const response = await fetch('https://api.openai.com/v1/audio/transcriptions', {
          method: 'POST',
          headers: {
            Authorization: `Bearer ${apiKey}`,
          },
          body: form,
          signal: controller.signal,
        });

        if (!response.ok) {
          const { status } = response;
          retryable =
            status < 400 || status >= 500 || status === 408 || status === 409 || status === 429;
          const detail = await extractOpenAiError(response);
          throw new Error(`OpenAI transcription failed (${response.status}): ${detail}`);
        }

        const payload = (await response.json()) as {
          text?: string;
          segments?: Array<{
            text?: string;
            start?: number;
          }>;
        };

        const segments = Array.isArray(payload.segments) ? payload.segments : [];
        if (segments.length > 0) {
          // Preferred path: one event per non-blank segment, placed at its start offset.
          for (const segment of segments) {
            const text = segment.text?.trim();
            if (!text) {
              continue;
            }

            const start = Number.isFinite(segment.start) ? Math.max(0, Number(segment.start)) : 0;
            const normalizedTimestamp = normalizeTranscriptTimestamp(sessionStartSec + start, sessionStartSec);
            recoveredEvents.push({
              text,
              isFinal: true,
              confidence: 0.9,
              timestamp: normalizedTimestamp,
              tier: 'whisper',
            });
          }
        } else if (payload.text?.trim()) {
          // No segment breakdown: emit the whole text as a single event at session start.
          recoveredEvents.push({
            text: payload.text.trim(),
            isFinal: true,
            confidence: 0.85,
            timestamp: normalizeTranscriptTimestamp(sessionStartSec, sessionStartSec),
            tier: 'whisper',
          });
        }
      } finally {
        // Always disarm the abort timer, whether the request succeeded or threw.
        clearTimeout(timeout);
      }

      if (recoveredEvents.length === 0) {
        throw new Error('No transcript text recovered from OpenAI transcription');
      }

      console.log(
        `[TranscriptionRecovery] Recovered ${recoveredEvents.length} segments via OpenAI (attempt ${attempt}/${maxAttempts}).`,
      );
      return recoveredEvents;
    } catch (error) {
      const message = error instanceof Error ? error.message : String(error);
      console.warn(
        `[TranscriptionRecovery] OpenAI recovery attempt ${attempt}/${maxAttempts} failed: ${message}`,
      );

      if (!retryable) {
        break;
      }

      if (attempt < maxAttempts) {
        const delayMs = 500 * attempt;
        await new Promise((resolve) => setTimeout(resolve, delayMs));
      }
    }
  }

  return [];
}
|
|
201
|
+
|
|
202
|
+
/**
 * Recover transcript via local Whisper from raw PCM audio samples.
 *
 * The samples are fed to `whisperService.transcribeSamples` in fixed-size
 * chunks (WHISPER_RECOVERY_CHUNK_SECONDS at 16000 samples per second). A full
 * pass over the audio counts as one attempt; an attempt that throws, or that
 * yields no non-blank text, is retried after a linearly growing delay.
 *
 * @param audioSamples - Mono PCM samples to transcribe
 * @param sessionStartSec - Session start time, used to offset chunk start times
 *   and passed to normalizeTranscriptTimestamp
 * @param maxAttempts - Maximum number of full transcription passes
 * @returns Recovered transcript events, or an empty array once all attempts fail
 */
async function recoverWithWhisper(
  audioSamples: Float32Array,
  sessionStartSec: number,
  maxAttempts: number,
): Promise<TranscriptEvent[]> {
  const sampleRate = 16000;
  const chunkSamples = sampleRate * WHISPER_RECOVERY_CHUNK_SECONDS;
  const pause = (ms: number) => new Promise((resolve) => setTimeout(resolve, ms));

  let attempt = 1;
  while (attempt <= maxAttempts) {
    try {
      const collected: Array<{
        text: string;
        startTime: number;
        endTime: number;
        confidence: number;
      }> = [];

      let cursor = 0;
      while (cursor < audioSamples.length) {
        const chunkEnd = Math.min(audioSamples.length, cursor + chunkSamples);
        const chunkStartSec = sessionStartSec + cursor / sampleRate;
        const chunkSegments = await whisperService.transcribeSamples(
          audioSamples.subarray(cursor, chunkEnd),
          chunkStartSec,
        );
        for (const chunkSegment of chunkSegments) {
          collected.push(chunkSegment);
        }

        // Yield between chunks to keep the app responsive during longer sessions.
        const hasMoreChunks = cursor + chunkSamples < audioSamples.length;
        if (hasMoreChunks) {
          await pause(0);
        }
        cursor += chunkSamples;
      }

      // Convert every segment to an event, keeping only those with visible text.
      const recoveredEvents: TranscriptEvent[] = [];
      for (const segment of collected) {
        const event: TranscriptEvent = {
          text: segment.text,
          isFinal: true as const,
          confidence: segment.confidence,
          timestamp: normalizeTranscriptTimestamp(segment.startTime, sessionStartSec),
          tier: 'whisper' as const,
        };
        if (event.text.trim().length > 0) {
          recoveredEvents.push(event);
        }
      }

      // An empty result is treated as a failed attempt so the retry logic applies.
      if (recoveredEvents.length === 0) {
        throw new Error('No transcript text recovered from captured audio');
      }

      console.log(
        `[TranscriptionRecovery] Recovered ${recoveredEvents.length} segments via Whisper (attempt ${attempt}/${maxAttempts}).`,
      );
      return recoveredEvents;
    } catch (error) {
      const message = error instanceof Error ? error.message : String(error);
      console.warn(
        `[TranscriptionRecovery] Whisper recovery attempt ${attempt}/${maxAttempts} failed: ${message}`,
      );

      // Linear backoff; no wait after the final attempt.
      if (attempt < maxAttempts) {
        await pause(400 * attempt);
      }
    }
    attempt += 1;
  }

  return [];
}
|
|
266
|
+
|
|
267
|
+
// =============================================================================
|
|
268
|
+
// Main Recovery Orchestrator
|
|
269
|
+
// =============================================================================
|
|
270
|
+
|
|
271
|
+
/**
 * Run post-session transcription recovery.
 *
 * Attempts OpenAI API first, then falls back to local Whisper.
 * Returns recovered transcript events, or an empty array if all strategies fail.
 *
 * The Whisper fallback reinterprets `capturedAudioBuffer` as 32-bit float
 * samples at 16000 samples per second. It is skipped when there is no raw
 * buffer, when the audio is longer than
 * MAX_POST_SESSION_LOCAL_RECOVERY_DURATION_SEC, or when no local model is
 * available.
 *
 * @param sessionStartSec - Session start time in epoch seconds
 * @param audioData - Audio data from the capture service
 * @returns Recovered transcript events (may be empty)
 */
export async function recoverTranscript(
  sessionStartSec: number,
  audioData: RecoveryAudioData,
): Promise<TranscriptEvent[]> {
  // Try OpenAI first (best quality)
  if (audioData.capturedAudioAsset && audioData.capturedAudioAsset.buffer.byteLength > 0) {
    const openAiApiKey = await getOpenAIApiKey();
    if (openAiApiKey) {
      const openAiRecovered = await recoverWithOpenAI(
        audioData.capturedAudioAsset,
        sessionStartSec,
        openAiApiKey,
        2,
      );
      if (openAiRecovered.length > 0) {
        return openAiRecovered;
      }
    } else {
      console.warn('[TranscriptionRecovery] OpenAI recovery skipped: API key not configured.');
    }
  } else {
    console.warn('[TranscriptionRecovery] OpenAI recovery skipped: no captured audio asset.');
  }

  // Fall back to local Whisper (raw PCM only)
  const pcm = audioData.capturedAudioBuffer;
  if (!pcm || pcm.byteLength === 0) {
    console.warn('[TranscriptionRecovery] Whisper recovery skipped: captured audio is encoded-only.');
    return [];
  }

  // A Float32Array view requires its byteOffset to be a multiple of 4; a view
  // over a sliced or pooled buffer may not satisfy that and the constructor
  // would throw a RangeError. Copy the bytes into a fresh, aligned buffer in
  // that case. Trailing bytes that do not form a whole sample are ignored.
  const bytesPerSample = Float32Array.BYTES_PER_ELEMENT;
  const sampleCount = Math.floor(pcm.byteLength / bytesPerSample);
  const audioSamples =
    pcm.byteOffset % bytesPerSample === 0
      ? new Float32Array(pcm.buffer, pcm.byteOffset, sampleCount)
      : new Float32Array(
          pcm.buffer.slice(pcm.byteOffset, pcm.byteOffset + sampleCount * bytesPerSample),
        );
  if (audioSamples.length === 0) {
    return [];
  }

  // Local transcription is skipped for sessions longer than the configured cap.
  const audioDurationSec = audioSamples.length / 16000;
  if (audioDurationSec > MAX_POST_SESSION_LOCAL_RECOVERY_DURATION_SEC) {
    console.warn(
      `[TranscriptionRecovery] Whisper recovery skipped for long session (${Math.round(audioDurationSec)}s).`,
    );
    return [];
  }

  if (!whisperService.isModelAvailable()) {
    console.warn('[TranscriptionRecovery] Whisper recovery skipped: no local model available.');
    return [];
  }

  const whisperRecovered = await recoverWithWhisper(audioSamples, sessionStartSec, 3);
  if (whisperRecovered.length > 0) {
    return whisperRecovered;
  }

  console.warn('[TranscriptionRecovery] All recovery strategies exhausted without transcript output.');
  return [];
}
|