Change Whisper model from large to medium for faster transcription and lower memory use

This commit is contained in:
2025-11-30 21:33:34 +01:00
parent 6f3b862bdb
commit 347cf7f50d

View File

@@ -65,7 +65,7 @@ console.print("✔ Hang kinyerve: audio.wav\n")
# --- 2. Whisper STT (angol beszéd felismerés) --- # --- 2. Whisper STT (angol beszéd felismerés) ---
console.print("🎤 [2/6] Speech-to-Text (Whisper, EN felismerés)…") console.print("🎤 [2/6] Speech-to-Text (Whisper, EN felismerés)…")
model = whisper.load_model("large") # stabil, többnyelvű model = whisper.load_model("medium") # stabil, többnyelvű
with Progress(TextColumn("Whisper STT…"), BarColumn(), TimeElapsedColumn(), TimeRemainingColumn()) as p: with Progress(TextColumn("Whisper STT…"), BarColumn(), TimeElapsedColumn(), TimeRemainingColumn()) as p:
p.add_task("STT fut…", total=None) p.add_task("STT fut…", total=None)
result = model.transcribe(AUDIO_WAV, language="en") result = model.transcribe(AUDIO_WAV, language="en")