PyPI - PayPerTranscript - Versions diffs - 0.2.0__py3-none-any.whl - Mend

PayPerTranscript 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (40)

paypertranscript/__init__.py +3 -0
paypertranscript/__main__.py +51 -0
paypertranscript/assets/icons/app.ico +0 -0
paypertranscript/assets/icons/app.png +0 -0
paypertranscript/assets/icons/arrow_down.svg +3 -0
paypertranscript/assets/sounds/start.wav +0 -0
paypertranscript/assets/sounds/stop.wav +0 -0
paypertranscript/assets/styles/dark.qss +388 -0
paypertranscript/core/__init__.py +0 -0
paypertranscript/core/audio_manager.py +142 -0
paypertranscript/core/config.py +360 -0
paypertranscript/core/cost_tracker.py +87 -0
paypertranscript/core/hotkey.py +294 -0
paypertranscript/core/logging.py +65 -0
paypertranscript/core/paths.py +28 -0
paypertranscript/core/recorder.py +167 -0
paypertranscript/core/session_logger.py +138 -0
paypertranscript/core/text_inserter.py +131 -0
paypertranscript/core/window_detector.py +58 -0
paypertranscript/pipeline/__init__.py +0 -0
paypertranscript/pipeline/transcription.py +361 -0
paypertranscript/providers/__init__.py +85 -0
paypertranscript/providers/base.py +78 -0
paypertranscript/providers/groq_provider.py +182 -0
paypertranscript/ui/__init__.py +0 -0
paypertranscript/ui/app.py +370 -0
paypertranscript/ui/dashboard.py +92 -0
paypertranscript/ui/overlay.py +396 -0
paypertranscript/ui/settings.py +550 -0
paypertranscript/ui/setup_wizard.py +690 -0
paypertranscript/ui/statistics.py +412 -0
paypertranscript/ui/tray.py +256 -0
paypertranscript/ui/window_mapping.py +460 -0
paypertranscript/ui/word_list.py +183 -0
paypertranscript-0.2.0.dist-info/METADATA +159 -0
paypertranscript-0.2.0.dist-info/RECORD +40 -0
paypertranscript-0.2.0.dist-info/WHEEL +5 -0
paypertranscript-0.2.0.dist-info/entry_points.txt +2 -0
paypertranscript-0.2.0.dist-info/licenses/LICENSE +21 -0
paypertranscript-0.2.0.dist-info/top_level.txt +1 -0

paypertranscript/core/config.py ADDED Viewed

@@ -0,0 +1,360 @@
+"""Konfigurationsmanagement für PayPerTranscript.
+JSON-basiert, Merge-on-Write, Schema-Validierung mit Fallback auf Defaults.
+Alle Laufzeit-Daten liegen unter %APPDATA%\\PayPerTranscript\\.
+"""
+import copy
+import json
+import os
+import sys
+from pathlib import Path
+from typing import Any
+from paypertranscript.core.logging import APPDATA_DIR, get_logger
+# Module-level logger used by everything in this file.
+log = get_logger("core.config")
+# JSON file that ConfigManager reads from and writes to.
+CONFIG_FILE = APPDATA_DIR / "config.json"
+# Directory created by _ensure_dirs(); presumably holds recorded audio — confirm against the recorder module.
+AUDIO_DIR = APPDATA_DIR / "audio"
+# Not referenced in this module; presumably the usage/cost tracking store — verify against its consumers.
+TRACKING_FILE = APPDATA_DIR / "tracking.json"
+# Built-in defaults. ConfigManager merges the user's config.json over this
+# dict, and _validate_config() falls back to these values for missing or
+# wrongly typed entries.
+DEFAULT_CONFIG: dict[str, Any] = {
+    "general": {
+        "language": "de",
+        "autostart": False,
+        "sound_enabled": False,
+        # Key names of the hold-to-record hotkey — presumably interpreted by the hotkey module; confirm there.
+        "hold_hotkey": ["ctrl", "cmd"],
+        # None means no toggle hotkey is configured (the schema allows list or None).
+        "toggle_hotkey": None,
+        "streaming_typing": False,
+        "overlay_position": "mouse_cursor",
+    },
+    "api": {
+        "provider": "groq",
+        "stt_model": "whisper-large-v3-turbo",
+        "llm_model": "openai/gpt-oss-20b",
+    },
+    "words": {
+        "misspelled_words": [],
+    },
+    "formatting": {
+        # Maps an application identifier to a key of "categories" below
+        # (presumably matched against the active window's process — verify
+        # against the window detector).
+        "window_mappings": {
+            "WhatsApp.Root.exe": "casual",
+            "Telegram.exe": "casual",
+            "Discord.exe": "casual",
+            "Outlook": "professional",
+        },
+        # Each category has a display name and a German LLM prompt. The
+        # prompts are runtime text and must not be altered casually.
+        "categories": {
+            "casual": {
+                "name": "Persönlich",
+                # Prompt: format as a casual chat message, all lowercase,
+                # minimal punctuation, no trailing period, output text only.
+                "prompt": (
+                    "Formatiere den folgenden transkribierten Text als lockere "
+                    "Chat-Nachricht. Alles kleingeschrieben, minimale Interpunktion, "
+                    "Kommas zur Trennung von Gedanken. Kein Punkt am Ende. "
+                    "Gib NUR den formatierten Text aus, keine Erklärungen."
+                ),
+            },
+            "professional": {
+                "name": "Professionell",
+                # Prompt: format as a professional message with correct
+                # capitalisation and punctuation, drop filler words and
+                # repetitions, short paragraphs, output text only.
+                "prompt": (
+                    "Formatiere den folgenden transkribierten Text als professionelle "
+                    "Nachricht. Korrekte Groß-/Kleinschreibung, saubere Interpunktion, "
+                    "entferne Füllwörter und Wiederholungen. Sachlicher Stil, kurze "
+                    "Absätze. Gib NUR den formatierten Text aus, keine Erklärungen."
+                ),
+            },
+        },
+    },
+    "data": {
+        "audio_retention_hours": 24,
+        "save_transcripts": False,
+    },
+}
+# Schema: allowed type(s) per dot-separated config path, used by
+# _validate_config(). Only the paths listed here are type-checked.
+_SCHEMA: dict[str, type | tuple[type, ...]] = {
+    "general.language": str,
+    "general.autostart": bool,
+    "general.sound_enabled": bool,
+    "general.hold_hotkey": list,
+    "general.toggle_hotkey": (list, type(None)),
+    "general.streaming_typing": bool,
+    "general.overlay_position": str,
+    "api.provider": str,
+    "api.stt_model": str,
+    "api.llm_model": str,
+    "words.misspelled_words": list,
+    "formatting.window_mappings": dict,
+    "formatting.categories": dict,
+    "data.audio_retention_hours": (int, float),
+    "data.save_transcripts": bool,
+}
+def _deep_merge(base: dict, override: dict) -> dict:
+    """Merge override in base (rekursiv). Gibt neues Dict zurück."""
+    result = copy.deepcopy(base)
+    for key, value in override.items():
+        if key in result and isinstance(result[key], dict) and isinstance(value, dict):
+            result[key] = _deep_merge(result[key], value)
+        else:
+            result[key] = copy.deepcopy(value)
+    return result
+def _validate_config(config: dict) -> dict:
+    """Validiert Config gegen Schema. Ungültige Werte werden durch Defaults ersetzt."""
+    validated = copy.deepcopy(config)
+    for path, expected_type in _SCHEMA.items():
+        parts = path.split(".")
+        # Wert aus Config holen
+        node = validated
+        default_node = DEFAULT_CONFIG
+        valid = True
+        for part in parts[:-1]:
+            if isinstance(node, dict) and part in node:
+                node = node[part]
+                default_node = default_node[part]
+            else:
+                valid = False
+                break
+        if not valid:
+            continue
+        key = parts[-1]
+        if key not in node:
+            # Fehlender Wert → Default einsetzen
+            node[key] = copy.deepcopy(default_node[key])
+            log.warning("Config: Fehlender Wert '%s' → Default verwendet", path)
+        elif not isinstance(node[key], expected_type):
+            old_val = node[key]
+            node[key] = copy.deepcopy(default_node[key])
+            log.warning(
+                "Config: Ungültiger Typ für '%s' (%s statt %s) → Default verwendet",
+                path,
+                type(old_val).__name__,
+                expected_type,
+            )
+    return validated
+def _ensure_dirs() -> None:
+    """Erstellt alle nötigen Verzeichnisse."""
+    APPDATA_DIR.mkdir(parents=True, exist_ok=True)
+    AUDIO_DIR.mkdir(parents=True, exist_ok=True)
+class ConfigManager:
+    """Verwaltet die App-Konfiguration.
+    - Lädt Config aus JSON (mit Fallback auf Defaults)
+    - Merge-on-Write: bestehende Config lesen, neue Werte mergen, schreiben
+    - Schema-Validierung bei Load
+    """
+    def __init__(self) -> None:
+        _ensure_dirs()
+        self._config: dict[str, Any] = self._load()
+    def _load(self) -> dict[str, Any]:
+        """Lädt Config aus Datei, merged mit Defaults, validiert."""
+        if CONFIG_FILE.exists():
+            try:
+                raw = json.loads(CONFIG_FILE.read_text(encoding="utf-8"))
+                if not isinstance(raw, dict):
+                    log.warning("Config-Datei enthält kein Dict → Defaults verwendet")
+                    raw = {}
+            except (json.JSONDecodeError, OSError) as e:
+                log.warning("Config-Datei konnte nicht gelesen werden: %s → Defaults verwendet", e)
+                raw = {}
+        else:
+            log.info("Keine Config-Datei gefunden → Defaults werden verwendet")
+            raw = {}
+        merged = _deep_merge(DEFAULT_CONFIG, raw)
+        validated = _validate_config(merged)
+        return validated
+    def _save(self) -> None:
+        """Speichert aktuelle Config in Datei."""
+        _ensure_dirs()
+        try:
+            CONFIG_FILE.write_text(
+                json.dumps(self._config, indent=2, ensure_ascii=False),
+                encoding="utf-8",
+            )
+            log.debug("Config gespeichert: %s", CONFIG_FILE)
+        except OSError as e:
+            log.error("Config konnte nicht gespeichert werden: %s", e)
+    @property
+    def config(self) -> dict[str, Any]:
+        """Gibt die komplette Config als Dict zurück (Read-only Kopie)."""
+        return copy.deepcopy(self._config)
+    def get(self, path: str, default: Any = None) -> Any:
+        """Holt einen Wert per Punkt-Pfad (z.B. 'general.language').
+        Args:
+            path: Punkt-separierter Pfad zum Wert.
+            default: Fallback, wenn Pfad nicht existiert.
+        """
+        node = self._config
+        for part in path.split("."):
+            if isinstance(node, dict) and part in node:
+                node = node[part]
+            else:
+                return default
+        return copy.deepcopy(node)
+    def set(self, path: str, value: Any) -> None:
+        """Setzt einen Wert per Punkt-Pfad und speichert.
+        Merge-on-Write: Liest aktuelle Datei, merged, speichert.
+        Args:
+            path: Punkt-separierter Pfad (z.B. 'general.language').
+            value: Neuer Wert.
+        """
+        # Aktuellen Stand von Disk lesen (falls von außen geändert)
+        if CONFIG_FILE.exists():
+            try:
+                disk_config = json.loads(CONFIG_FILE.read_text(encoding="utf-8"))
+                if isinstance(disk_config, dict):
+                    self._config = _deep_merge(DEFAULT_CONFIG, disk_config)
+                    self._config = _validate_config(self._config)
+            except (json.JSONDecodeError, OSError):
+                pass
+        # Wert setzen
+        parts = path.split(".")
+        node = self._config
+        for part in parts[:-1]:
+            if part not in node or not isinstance(node[part], dict):
+                node[part] = {}
+            node = node[part]
+        node[parts[-1]] = value
+        log.info("Config geändert: %s = %s", path, value)
+        self._save()
+    def update(self, updates: dict[str, Any]) -> None:
+        """Merged ein Dict in die Config und speichert.
+        Args:
+            updates: Dict mit Werten zum Mergen (gleiche Struktur wie Config).
+        """
+        self._config = _deep_merge(self._config, updates)
+        self._config = _validate_config(self._config)
+        self._save()
+    def reload(self) -> None:
+        """Lädt Config erneut von Disk."""
+        self._config = self._load()
+        log.info("Config neu geladen")
+    def is_first_run(self) -> bool:
+        """Prüft ob dies der erste Start ist (keine Config-Datei vorhanden)."""
+        return not CONFIG_FILE.exists()
+    def save_initial(self) -> None:
+        """Speichert die initiale Config (nach Setup-Wizard)."""
+        self._save()
+# -- API key storage via the Windows Credential Manager --
+# Service and account name under which the key is stored through keyring.
+KEYRING_SERVICE = "PayPerTranscript"
+KEYRING_ACCOUNT = "groq_api_key"
+def save_api_key(api_key: str) -> None:
+    """Speichert den API-Key im Windows Credential Manager (keyring)."""
+    import keyring
+    keyring.set_password(KEYRING_SERVICE, KEYRING_ACCOUNT, api_key)
+    log.info("API-Key im Credential Manager gespeichert")
+def load_api_key() -> str | None:
+    """Lädt den API-Key aus dem Windows Credential Manager (keyring).
+    Returns:
+        Den API-Key oder None wenn keiner gespeichert ist.
+    """
+    import keyring
+    try:
+        key = keyring.get_password(KEYRING_SERVICE, KEYRING_ACCOUNT)
+        if key:
+            log.debug("API-Key aus Credential Manager geladen")
+        return key
+    except Exception as e:
+        log.warning("Keyring-Zugriff fehlgeschlagen: %s", e)
+        return None
+# -- Autostart via the Windows Startup folder --
+# Startup folder below %APPDATA%.
+# NOTE(review): if APPDATA is unset this becomes a relative path — confirm the
+# autostart helpers are only ever called on Windows.
+_STARTUP_DIR = Path(os.environ.get("APPDATA", "")) / (
+    r"Microsoft\Windows\Start Menu\Programs\Startup"
+)
+# File name of the shortcut created in the Startup folder.
+_SHORTCUT_NAME = "PayPerTranscript.lnk"
+def enable_autostart() -> bool:
+    """Erstellt Windows-Startup-Shortcut. Returns True bei Erfolg."""
+    try:
+        import shutil
+        import win32com.client  # type: ignore[import-untyped]
+        shortcut_path = _STARTUP_DIR / _SHORTCUT_NAME
+        shell = win32com.client.Dispatch("WScript.Shell")
+        shortcut = shell.CreateShortCut(str(shortcut_path))
+        # pip-installiertes GUI-Script suchen
+        entry_point = shutil.which("paypertranscript")
+        if entry_point:
+            shortcut.Targetpath = str(Path(entry_point))
+            shortcut.WorkingDirectory = str(Path.home())
+            shortcut.Arguments = ""
+        else:
+            # Fallback: pythonw.exe -m paypertranscript (kein CMD-Fenster)
+            python_dir = Path(sys.executable).parent
+            pythonw = python_dir / "pythonw.exe"
+            if not pythonw.exists():
+                log.warning("pythonw.exe nicht gefunden — Fallback auf python.exe")
+                pythonw = Path(sys.executable)
+            shortcut.Targetpath = str(pythonw)
+            shortcut.WorkingDirectory = str(Path.home())
+            shortcut.Arguments = "-m paypertranscript"
+        shortcut.Description = "PayPerTranscript — Voice-to-Text"
+        shortcut.save()
+        log.info("Autostart-Shortcut erstellt: %s", shortcut_path)
+        return True
+    except Exception as e:
+        log.error("Autostart konnte nicht aktiviert werden: %s", e)
+        return False
+def disable_autostart() -> bool:
+    """Entfernt Windows-Startup-Shortcut. Returns True bei Erfolg."""
+    try:
+        shortcut_path = _STARTUP_DIR / _SHORTCUT_NAME
+        if shortcut_path.exists():
+            shortcut_path.unlink()
+            log.info("Autostart-Shortcut entfernt: %s", shortcut_path)
+        return True
+    except Exception as e:
+        log.error("Autostart konnte nicht deaktiviert werden: %s", e)
+        return False
+def is_autostart_enabled() -> bool:
+    """Prüft ob der Autostart-Shortcut existiert."""
+    return (_STARTUP_DIR / _SHORTCUT_NAME).exists()

paypertranscript/core/cost_tracker.py ADDED Viewed

@@ -0,0 +1,87 @@
+"""Kostenberechnung fuer PayPerTranscript.
+Reine Berechnungsfunktionen fuer STT- und LLM-Kosten.
+Keine I/O, keine Seiteneffekte — einfach testbar.
+"""
+from dataclasses import dataclass
+# STT/LLM API prices (as of 2026-02)
+STT_PRICE_PER_HOUR_USD = 0.04
+STT_MIN_BILLED_SECONDS = 10  # minimum billing applied on the API side
+LLM_INPUT_PRICE_PER_M_TOKENS = 0.075   # USD per million input tokens
+LLM_OUTPUT_PRICE_PER_M_TOKENS = 0.30   # USD per million output tokens
+@dataclass(frozen=True)
+class CostResult:
+    """Immutable result of one cost calculation (STT plus optional LLM)."""
+    # Audio duration in seconds, as passed in by the caller.
+    audio_duration_seconds: float
+    # Seconds actually billed (never below STT_MIN_BILLED_SECONDS).
+    billed_seconds: float
+    # Speech-to-text cost in USD for the billed seconds.
+    stt_cost_usd: float
+    # Token counts the LLM cost was computed from (0 when no LLM was used).
+    llm_input_tokens: int
+    llm_output_tokens: int
+    # LLM cost in USD.
+    llm_cost_usd: float
+    # Sum of stt_cost_usd and llm_cost_usd.
+    total_cost_usd: float
+def calculate_stt_cost(audio_duration_seconds: float) -> tuple[float, float]:
+    """Berechnet STT-Kosten.
+    Args:
+        audio_duration_seconds: Tatsaechliche Audio-Dauer in Sekunden.
+    Returns:
+        Tuple (billed_seconds, cost_usd).
+    """
+    billed = max(audio_duration_seconds, STT_MIN_BILLED_SECONDS)
+    cost = billed / 3600.0 * STT_PRICE_PER_HOUR_USD
+    return billed, cost
+def calculate_llm_cost(input_tokens: int, output_tokens: int) -> float:
+    """Berechnet LLM-Kosten.
+    Args:
+        input_tokens: Anzahl Input-Tokens.
+        output_tokens: Anzahl Output-Tokens.
+    Returns:
+        Kosten in USD.
+    """
+    return (
+        input_tokens * LLM_INPUT_PRICE_PER_M_TOKENS
+        + output_tokens * LLM_OUTPUT_PRICE_PER_M_TOKENS
+    ) / 1_000_000
+def calculate_total_cost(
+    audio_duration_seconds: float,
+    llm_input_tokens: int = 0,
+    llm_output_tokens: int = 0,
+) -> CostResult:
+    """Berechnet Gesamtkosten einer Transkription.
+    Args:
+        audio_duration_seconds: Audio-Dauer in Sekunden.
+        llm_input_tokens: LLM Input-Tokens (0 wenn kein LLM).
+        llm_output_tokens: LLM Output-Tokens (0 wenn kein LLM).
+    Returns:
+        CostResult mit allen Kosten-Details.
+    """
+    billed, stt_cost = calculate_stt_cost(audio_duration_seconds)
+    llm_cost = calculate_llm_cost(llm_input_tokens, llm_output_tokens)
+    return CostResult(
+        audio_duration_seconds=audio_duration_seconds,
+        billed_seconds=billed,
+        stt_cost_usd=stt_cost,
+        llm_input_tokens=llm_input_tokens,
+        llm_output_tokens=llm_output_tokens,
+        llm_cost_usd=llm_cost,
+        total_cost_usd=stt_cost + llm_cost,
+    )