Use GitHub orpheus-tts (supports max_model_len) to fix OOM on Jetson

2026-01-11 17:39:55 -06:00
parent 86cf77d2d9
commit 0e43b76204
3 changed files with 11 additions and 6 deletions
--- a/main.py
+++ b/main.py
@@ -326,9 +326,11 @@ async def startup():
    print("Loading Orpheus model (this may take a moment)...")
    from orpheus_tts import OrpheusModel
    
-    # Note: PyPI orpheus-speech 0.1.0 uses simpler API
-    # model_name can be "medium-3b" or full HF path
-    model = OrpheusModel(model_name=ORPHEUS_MODEL)
+    # The GitHub version of orpheus-tts accepts max_model_len; pass it to control memory use
+    model = OrpheusModel(
+        model_name=ORPHEUS_MODEL,
+        max_model_len=MAX_MODEL_LEN
+    )
    
    print("✓ Orpheus model loaded successfully")