0.2.8: only the Whisper decoder is loaded into memory when a different encoder is used

2026-03-07 14:23:18 +00:00 · 2025-09-02 21:12:25 +02:00
parent 50b0527858
commit 3bd2122eb4
11 changed files with 112 additions and 47 deletions
--- a/whisperlivekit/parse_args.py
+++ b/whisperlivekit/parse_args.py
@@ -161,6 +161,14 @@ def parse_args():

    # SimulStreaming-specific arguments
    simulstreaming_group = parser.add_argument_group('SimulStreaming arguments (only used with --backend simulstreaming)')
+
+    simulstreaming_group.add_argument(
+        "--disable-fast-encoder",
+        action="store_true",
+        default=False,
+        dest="disable_fast_encoder",
+        help="Disable Faster Whisper or MLX Whisper backends for encoding (if installed). Slower but helpful when GPU memory is limited",
+    )
    
    simulstreaming_group.add_argument(
        "--frame-threshold",