From 614ff841fe5a1d823dee66a0c41eafedc590e8ff Mon Sep 17 00:00:00 2001
From: michael
Date: Sun, 28 Dec 2025 21:20:03 -0600
Subject: [PATCH] feat: upgrade Whisper model from base to large-v3
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Uses the multilingual large model for more accurate transcription
and sentence boundary detection.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5
---
 backend/app/core/config.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/backend/app/core/config.py b/backend/app/core/config.py
index ec692fb..dc7a4fd 100644
--- a/backend/app/core/config.py
+++ b/backend/app/core/config.py
@@ -165,7 +165,7 @@ class Settings(BaseSettings):
     gemini_tts_speed_step: float = 0.1
 
     # Whisper Configuration (for pause point refinement)
-    whisper_model: str = "base" # Options: tiny, base, small, medium, large-v3
+    whisper_model: str = "large-v3" # Options: tiny, base, small, medium, large-v3
     whisper_max_search_window: float = 5.0 # Max seconds to search for speech gap after Gemini point
     whisper_sentence_gap_threshold: float = 0.5 # Gap duration to classify as sentence boundary
     whisper_phrase_gap_threshold: float = 0.3 # Gap duration to classify as phrase boundary