feat: add automatic stop after a configurable amount of silence.

2026-02-18 16:12:54 +01:00
parent 85230a14a8
commit 134200d345
2 changed files with 56 additions and 1 deletions
--- a/calliope/app.py
+++ b/calliope/app.py
@@ -6,6 +6,8 @@ import threading
 import time
 from typing import Any

+import numpy as np
+
 import subprocess

 import rumps
@@ -54,6 +56,12 @@ class CalliopeApp(rumps.App):
        self._transcribe_done = threading.Event()
        self._transcribe_done.set()  # not transcribing initially

+        # Silence-based auto-stop
+        self._silence_since: float | None = None
+        self._rec_has_speech: bool = False
+        self._silence_stop_evt: threading.Event = threading.Event()
+        self._silence_stop_evt.set()  # not monitoring initially
+
        self.status_item = rumps.MenuItem("Status: Loading model...")
        self.status_item.set_callback(None)
        self.toggle_item = rumps.MenuItem("Start Recording", callback=self._on_toggle_click)
@@ -86,6 +94,13 @@ class CalliopeApp(rumps.App):
        self._pp_menu = rumps.MenuItem("Post-Processing")
        self._build_pp_menu()

+        # Auto-stop on silence toggle
+        auto_stop = cfg.get("auto_stop_silence", True)
+        prefix = "\u2713 " if auto_stop else "   "
+        self._auto_stop_item = rumps.MenuItem(
+            f"{prefix}Auto-stop on Silence", callback=self._on_auto_stop_toggle
+        )
+
        # Typing mode submenu
        self._typing_menu = rumps.MenuItem("Typing Mode")
        current_mode = cfg.get("typing_mode", "char")
@@ -101,6 +116,7 @@ class CalliopeApp(rumps.App):
            self.status_item,
            None,
            self.toggle_item,
+            self._auto_stop_item,
            self.context_item,
            self._lang_menu,
            self._model_menu,
@@ -302,7 +318,10 @@ class CalliopeApp(rumps.App):
        self.title = "\U0001f534 0:00"  # 🔴
        self.toggle_item.title = "Stop Recording"
        self.status_item.title = "Status: Recording..."
-        self.recorder.on_audio = self.overlay.push_samples
+        self._silence_since = None
+        self._rec_has_speech = False
+        self._silence_stop_evt = threading.Event()
+        self.recorder.on_audio = self._on_audio_chunk
        try:
            self.recorder.start()
        except Exception:
@@ -317,6 +336,8 @@ class CalliopeApp(rumps.App):
        self.overlay.show()
        self._rec_timer = rumps.Timer(self._update_rec_duration, 1)
        self._rec_timer.start()
+        if self.cfg.get("auto_stop_silence", True):
+            threading.Thread(target=self._silence_monitor, daemon=True).start()
        self._notify("Calliope", "", "Recording started")
        log.info("Recording started")

@@ -325,6 +346,7 @@ class CalliopeApp(rumps.App):
            if not self._recording:
                return
            self._recording = False
+        self._silence_stop_evt.set()
        if self._rec_timer:
            self._rec_timer.stop()
            self._rec_timer = None
@@ -341,6 +363,37 @@ class CalliopeApp(rumps.App):
        self._transcribe_done.clear()
        threading.Thread(target=self._transcribe_and_type, args=(audio,), daemon=True).start()

+    def _on_audio_chunk(self, chunk: np.ndarray) -> None:
+        """Audio-thread callback: feed the overlay, then track when the current silence began."""
+        self.overlay.push_samples(chunk)
+        samples = np.asarray(chunk, dtype=np.float64)  # widen first: squaring in an integer PCM dtype would wrap
+        rms = float(np.sqrt(np.mean(samples ** 2))) if samples.size else 0.0  # an empty chunk counts as silence
+        if rms >= self.cfg.get("silence_threshold", 0.005):
+            self._rec_has_speech = True
+            self._silence_since = None  # any loud chunk resets the silence clock
+        elif self._rec_has_speech and self._silence_since is None:  # silence before any speech never arms the timer
+            self._silence_since = time.monotonic()  # start of the current quiet stretch
+
+    def _silence_monitor(self) -> None:
+        """Worker-thread loop: poll every 100 ms and stop the recording once silence has lasted the timeout."""
+        limit = self.cfg.get("silence_timeout_seconds", 1.5)  # read once, when the monitor starts
+        cancelled = self._silence_stop_evt  # keep this run's event; the attribute is rebound on each start
+        while not cancelled.is_set():
+            if (t0 := self._silence_since) is None or not (time.monotonic() - t0 >= limit):
+                cancelled.wait(0.1)  # sleeps, but wakes at once when the event is set
+            else:
+                log.info("Auto-stop: %.1fs of silence detected", limit)
+                self._stop_and_transcribe()  # NOTE(review): runs on this thread and stops the rumps timer — confirm that is safe
+                return
+
+    def _on_auto_stop_toggle(self, sender) -> None:  # menu callback; `sender` is unused
+        # Flip the stored flag (a missing key counts as enabled), then persist it and refresh the menu label.
+        self.cfg["auto_stop_silence"] = now_on = not self.cfg.get("auto_stop_silence", True)
+        config_mod.save(self.cfg)
+        mark, state = ("\u2713 ", "enabled") if now_on else ("   ", "disabled")
+        self._auto_stop_item.title = f"{mark}Auto-stop on Silence"
+        log.info("Auto-stop on silence %s", state)
+
    def _update_rec_duration(self, timer) -> None:
        if self._rec_start_time is None:
            return
--- a/calliope/config.py
+++ b/calliope/config.py
@@ -26,6 +26,8 @@ DEFAULTS: dict[str, Any] = {
    "silence_threshold": 0.005,  # RMS energy below which audio is considered silence
    "notifications": True,  # show macOS notifications
    "typing_delay": 0.005,  # seconds between keystrokes in char mode
+    "auto_stop_silence": True,  # stop recording automatically after sustained silence
+    "silence_timeout_seconds": 1.5,  # seconds of silence before auto-stop
    "postprocessing": {
        "enabled": False,
        "model": None,          # active model HF repo id