0.2.8: only the Whisper decoder is loaded in memory when a different encoder is used

2026-03-07 22:33:36 +00:00 · 2025-09-02 21:12:25 +02:00
parent 50b0527858
commit 3bd2122eb4
11 changed files with 112 additions and 47 deletions
--- a/whisperlivekit/basic_server.py
+++ b/whisperlivekit/basic_server.py
@@ -19,6 +19,15 @@ transcription_engine = None

@asynccontextmanager
 async def lifespan(app: FastAPI):
+    
+    #to remove after 0.2.8
+    if args.backend == "simulstreaming" and not args.disable_fast_encoder:
+        logger.warning(f"""
+{'='*50}
+WhisperLiveKit 0.2.8 has introduced a new fast encoder feature using MLX Whisper or Faster Whisper for improved speed. Use --disable-fast-encoder to disable if you encounter issues.
+{'='*50}
+    """)
+    
    global transcription_engine
    transcription_engine = TranscriptionEngine(
        **vars(args),