PyPI - speaker-detector - Versions diffs - 0.1.6__tar.gz → 0.1.7__tar.gz - Mend

speaker-detector 0.1.6 (tar.gz) → 0.1.7 (tar.gz)

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (32)

{speaker_detector-0.1.6 → speaker_detector-0.1.7}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: speaker-detector
-Version: 0.1.6
+Version: 0.1.7
 Summary: A CLI + Web tool for speaker enrollment and identification using SpeechBrain.
 Author-email: Lara Whybrow <lara.whybrow@gmail.com>
 License: MIT
@@ -29,7 +29,7 @@ Requires-Dist: sounddevice
 Requires-Dist: soundfile
 Requires-Dist: pydub
-Note: Still in development, as I am configuring the system for the most performant approach. Feel free to jump on the project with me.
+23/07/2025 - Lara Whybrow, Creator - Works as far as I can see, but now we have a robust set of tools for training and managing the data and can focus now on refinement and bug fixing.
 # speaker-detector 🎙️

{speaker_detector-0.1.6 → speaker_detector-0.1.7}/README.md RENAMED Viewed

@@ -1,4 +1,4 @@
-Note: Still in development, as I am configuring the system for the most performant approach. Feel free to jump on the project with me.
+23/07/2025 - Lara Whybrow, Creator - Works as far as I can see, but now we have a robust set of tools for training and managing the data and can focus now on refinement and bug fixing.
 # speaker-detector 🎙️

{speaker_detector-0.1.6 → speaker_detector-0.1.7}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "speaker-detector"
-version = "0.1.6"
+version = "0.1.7"
 description = "A CLI + Web tool for speaker enrollment and identification using SpeechBrain."
 readme = "README.md"
 requires-python = ">=3.8"

speaker_detector-0.1.7/speaker_detector/constants.py ADDED Viewed

@@ -0,0 +1,10 @@
+# speaker_detector/constants.py
+BACKEND_VERSION = "0.1.7"
+# API base paths (optional, for future centralization)
+API_PREFIX = "/api"
+# Thresholds and default settings
+DEFAULT_CONFIDENCE_THRESHOLD = 0.75
+DEFAULT_INTERVAL_MS = 3000

{speaker_detector-0.1.6 → speaker_detector-0.1.7}/speaker_detector/core.py RENAMED Viewed

@@ -114,3 +114,5 @@ def get_speakers_needing_rebuild() -> list[str]:
 # ── ALIAS FOR COMPATIBILITY ──────────────────────────────────────────────────
 rebuild_embeddings_for_speaker = rebuild_embedding

{speaker_detector-0.1.6 → speaker_detector-0.1.7}/speaker_detector/server.py RENAMED Viewed

@@ -1,26 +1,36 @@
 # ── Core Imports ─────────────────────────────────────────────
 import os, signal, time
-from flask import Flask, request, send_from_directory, send_file
+from flask import Flask, request, send_from_directory, send_file, jsonify
 from flask_cors import CORS
 from pathlib import Path
 # ── Internal Modules ─────────────────────────────────────────
-from speaker_detector.state import stop_event
 from speaker_detector.utils.paths import STATIC_DIR, INDEX_HTML, COMPONENTS_DIR
+from speaker_detector.speaker_state import LISTENING_MODE, start_detection_loop, stop_detection_loop, stop_event
+from speaker_detector.constants import BACKEND_VERSION
 # ── App Setup ────────────────────────────────────────────────
 app = Flask(__name__, static_folder=str(STATIC_DIR))
-CORS(app)
+CORS(app, resources={r"/api/*": {"origins": "*"}}, supports_credentials=True)
 # ── Routes ──────────────────────────────────────────────────
-@app.after_request
-def apply_csp(response):
-    response.headers["Content-Security-Policy"] = (
-        "default-src 'self'; script-src 'self'; style-src 'self'; object-src 'none';"
-    )
+@app.route("/api/<path:dummy>", methods=["OPTIONS"])
+def cors_preflight(dummy):
+    response = jsonify({"ok": True})
+    response.headers["Access-Control-Allow-Origin"] = "*"
+    response.headers["Access-Control-Allow-Headers"] = "Content-Type,Authorization"
+    response.headers["Access-Control-Allow-Methods"] = "GET,POST,OPTIONS"
     return response
+@app.route("/api/version")
+def get_version():
+    return jsonify({"version": BACKEND_VERSION})
 @app.route("/")
 def serve_index():
     return send_file(INDEX_HTML)
@@ -47,22 +57,25 @@ def not_found(e):
 # ── Route Registrations ─────────────────────────────────────
 from speaker_detector.routes.index_routes import index_bp
-from speaker_detector.routes.settings_routes import settings_bp
+from speaker_detector.routes.listening_mode_routes import listening_bp
 from speaker_detector.routes.speaker_routes import speakers_bp
 from speaker_detector.routes.background_routes import background_bp
 from speaker_detector.routes.rebuild_routes import rebuild_bp
 from speaker_detector.routes.identify_routes import identify_bp
 from speaker_detector.routes.recordings_routes import recordings_bp
 from speaker_detector.routes.meetings_routes import meetings_bp
+from speaker_detector.routes.correction_routes import correction_bp
 app.register_blueprint(index_bp)
-app.register_blueprint(settings_bp)
+app.register_blueprint(listening_bp)
 app.register_blueprint(speakers_bp)
 app.register_blueprint(background_bp)
 app.register_blueprint(rebuild_bp)
 app.register_blueprint(identify_bp)
 app.register_blueprint(recordings_bp)
 app.register_blueprint(meetings_bp)
+app.register_blueprint(correction_bp)
 # ── Interrupt Handler ───────────────────────────────────────
 def handle_interrupt(sig, frame):

speaker_detector-0.1.7/speaker_detector/speaker_state.py ADDED Viewed

@@ -0,0 +1,103 @@
+# speaker_detector/speaker_state.py
+import threading
+import tempfile
+import time
+import sounddevice as sd
+import soundfile as sf
+from datetime import datetime
+from speaker_detector.constants import DEFAULT_CONFIDENCE_THRESHOLD, DEFAULT_INTERVAL_MS
+from speaker_detector.core import identify_speaker
+# ── Shared Speaker Detection State ─────────────────────────────
+current_speaker_state = {
+    "speaker": None,
+    "confidence": None,
+    "is_speaking": False,
+}
+def get_current_speaker():
+    return current_speaker_state
+LISTENING_MODE = {"mode": "off"}  # Options: "off", "single", "multi"
+DETECTION_INTERVAL_MS = DEFAULT_INTERVAL_MS
+DETECTION_THRESHOLD = DEFAULT_CONFIDENCE_THRESHOLD
+MIC_AVAILABLE = True
+stop_event = threading.Event()
+detection_thread = None
+# ── Background Detection Loop ─────────────────────────────
+def detection_loop():
+    global MIC_AVAILABLE
+    samplerate = 16000
+    duration = 2  # seconds
+    while not stop_event.is_set():
+        try:
+            audio = sd.rec(int(duration * samplerate), samplerate=samplerate, channels=1, dtype="int16")
+            sd.wait()
+            with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
+                sf.write(tmp.name, audio, samplerate)
+                MIC_AVAILABLE = True
+                speaker, conf = identify_speaker(tmp.name, threshold=DETECTION_THRESHOLD)
+                current_speaker_state["speaker"] = speaker
+                current_speaker_state["confidence"] = conf
+                current_speaker_state["is_speaking"] = speaker != "unknown" and conf >= DETECTION_THRESHOLD
+                print(f"{datetime.now().strftime('%H:%M:%S')} 🧠 Detected: {speaker} ({conf:.2f})")
+        except Exception as e:
+            print(f"❌ Detection loop error: {e}")
+            current_speaker_state["speaker"] = None
+            current_speaker_state["confidence"] = None
+            current_speaker_state["is_speaking"] = False
+            if isinstance(e, sd.PortAudioError):
+                MIC_AVAILABLE = False
+        time.sleep(DETECTION_INTERVAL_MS / 1000.0)
+# ── Lifecycle Control ─────────────────────────────────────
+def start_detection_loop():
+    global detection_thread
+    if detection_thread and detection_thread.is_alive():
+        return
+    print("🔁 Starting detection loop...")
+    stop_event.clear()
+    detection_thread = threading.Thread(target=detection_loop, daemon=True)
+    detection_thread.start()
+def stop_detection_loop():
+    if detection_thread and detection_thread.is_alive():
+        print("⏹️ Stopping detection loop...")
+        stop_event.set()
+def get_active_speaker():
+    if LISTENING_MODE["mode"] == "off":
+        return {
+            "speaker": None,
+            "confidence": None,
+            "is_speaking": False,
+            "status": "disabled"
+        }
+    if not MIC_AVAILABLE:
+        return {
+            "speaker": None,
+            "confidence": None,
+            "is_speaking": False,
+            "status": "mic unavailable"
+        }
+    return {
+        "speaker": current_speaker_state.get("speaker"),
+        "confidence": current_speaker_state.get("confidence"),
+        "is_speaking": current_speaker_state.get("is_speaking", False),
+        "status": "listening"
+    }

{speaker_detector-0.1.6 → speaker_detector-0.1.7}/speaker_detector.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: speaker-detector
-Version: 0.1.6
+Version: 0.1.7
 Summary: A CLI + Web tool for speaker enrollment and identification using SpeechBrain.
 Author-email: Lara Whybrow <lara.whybrow@gmail.com>
 License: MIT
@@ -29,7 +29,7 @@ Requires-Dist: sounddevice
 Requires-Dist: soundfile
 Requires-Dist: pydub
-Note: Still in development, as I am configuring the system for the most performant approach. Feel free to jump on the project with me.
+23/07/2025 - Lara Whybrow, Creator - Works as far as I can see, but now we have a robust set of tools for training and managing the data and can focus now on refinement and bug fixing.
 # speaker-detector 🎙️

{speaker_detector-0.1.6 → speaker_detector-0.1.7}/speaker_detector.egg-info/SOURCES.txt RENAMED Viewed

@@ -2,10 +2,11 @@ README.md
 pyproject.toml
 speaker_detector/__main__.py
 speaker_detector/cli.py
+speaker_detector/constants.py
 speaker_detector/core.py
 speaker_detector/server copy.py
 speaker_detector/server.py
-speaker_detector/state.py
+speaker_detector/speaker_state.py
 speaker_detector.egg-info/PKG-INFO
 speaker_detector.egg-info/SOURCES.txt
 speaker_detector.egg-info/dependency_links.txt

speaker_detector-0.1.6/speaker_detector/state.py DELETED Viewed

@@ -1,69 +0,0 @@
-# speaker_detector/state.py
-import threading
-import tempfile
-import time
-import sounddevice as sd
-import soundfile as sf
-from datetime import datetime
-from pathlib import Path
-from speaker_detector.core import identify_speaker  # ✅ safe import — no circular loop
-# ── Global State ─────────────────────────────────────────────
-current_speaker = {"speaker": None, "confidence": None}
-LISTENING_MODE = {"mode": "off"}  # Values: "off", "single", "multi"
-DETECTION_INTERVAL_MS = 3000
-DETECTION_THRESHOLD = 0.75
-MIC_AVAILABLE = True
-stop_event = threading.Event()  # ✅ defined here, no self-import
-detection_thread = None
-# ── Background Detection Loop ────────────────────────────────
-def detection_loop():
-    global MIC_AVAILABLE
-    samplerate = 16000
-    duration = 2
-    while not stop_event.is_set():
-        try:
-            audio = sd.rec(int(duration * samplerate), samplerate=samplerate, channels=1, dtype="int16")
-            sd.wait()
-            with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
-                sf.write(tmp.name, audio, samplerate)
-                MIC_AVAILABLE = True
-                speaker, conf = identify_speaker(tmp.name, threshold=DETECTION_THRESHOLD)
-                current_speaker.update(speaker=speaker, confidence=conf)
-                print(f"{datetime.now().strftime('%H:%M:%S')} 🧠 Detected: {speaker} ({conf:.2f})")
-        except Exception as e:
-            print(f"❌ Detection loop error: {e}")
-            current_speaker.update(speaker=None, confidence=None)
-            if isinstance(e, sd.PortAudioError):
-                MIC_AVAILABLE = False
-        time.sleep(DETECTION_INTERVAL_MS / 1000.0)
-# ── Control Functions ────────────────────────────────────────
-def start_detection_loop():
-    global detection_thread
-    if detection_thread and detection_thread.is_alive():
-        return
-    print("🔁 Starting detection loop...")
-    stop_event.clear()
-    detection_thread = threading.Thread(target=detection_loop, daemon=True)
-    detection_thread.start()
-def stop_detection_loop():
-    if detection_thread and detection_thread.is_alive():
-        print("⏹️ Stopping detection loop...")
-        stop_event.set()
-def get_active_speaker():
-    if LISTENING_MODE["mode"] == "off":
-        return {"speaker": None, "confidence": None, "status": "disabled"}
-    if not MIC_AVAILABLE:
-        return {"speaker": None, "confidence": None, "status": "mic unavailable"}
-    return {**current_speaker, "status": "listening"}