Change Whisper model from large to medium for faster transcription and lower memory use
This commit is contained in:
2
main.py
2
main.py
@@ -65,7 +65,7 @@ console.print("✔ Hang kinyerve: audio.wav\n")
|
|||||||
# --- 2. Whisper STT (angol beszéd felismerés) ---
|
# --- 2. Whisper STT (angol beszéd felismerés) ---
|
||||||
console.print("🎤 [2/6] Speech-to-Text (Whisper, EN felismerés)…")
|
console.print("🎤 [2/6] Speech-to-Text (Whisper, EN felismerés)…")
|
||||||
|
|
||||||
model = whisper.load_model("large") # stabil, többnyelvű
|
model = whisper.load_model("medium") # stabil, többnyelvű
|
||||||
with Progress(TextColumn("Whisper STT…"), BarColumn(), TimeElapsedColumn(), TimeRemainingColumn()) as p:
|
with Progress(TextColumn("Whisper STT…"), BarColumn(), TimeElapsedColumn(), TimeRemainingColumn()) as p:
|
||||||
p.add_task("STT fut…", total=None)
|
p.add_task("STT fut…", total=None)
|
||||||
result = model.transcribe(AUDIO_WAV, language="en")
|
result = model.transcribe(AUDIO_WAV, language="en")
|
||||||
|
|||||||
Reference in New Issue
Block a user