Add scripts
This commit is contained in:
parent
c196f14ae9
commit
992a748c51
5 changed files with 230 additions and 0 deletions
44
scripts/local_whisper.py
Normal file
44
scripts/local_whisper.py
Normal file
|
|
@ -0,0 +1,44 @@
|
|||
#!/usr/bin/env python3
|
||||
"""
|
||||
Транскрипция аудио через faster-whisper с исправлением MKL ошибки.
|
||||
|
||||
ИСПОЛЬЗОВАНИЕ:
|
||||
import os
|
||||
os.environ["MKL_SERVICE_FORCE_INTEL"] = "1"
|
||||
os.environ["OMP_NUM_THREADS"] = "2"
|
||||
|
||||
from faster_whisper import WhisperModel
|
||||
model = WhisperModel("small")
|
||||
"""
|
||||
|
||||
import os
|
||||
import sys
|
||||
|
||||
# CRITICAL: Must be set BEFORE importing faster_whisper
|
||||
os.environ["MKL_SERVICE_FORCE_INTEL"] = "1"
|
||||
os.environ["OMP_NUM_THREADS"] = "2"
|
||||
|
||||
from faster_whisper import WhisperModel
|
||||
|
||||
def transcribe_audio(audio_path, model_size="small", language="ru"):
    """Transcribe an audio file and return its segments as a list.

    Args:
        audio_path: Forwarded unchanged to ``WhisperModel.transcribe``.
        model_size: Forwarded to the ``WhisperModel`` constructor.
        language: Forwarded to ``transcribe`` as the ``language`` keyword.

    Returns:
        A list built from the first element of the pair returned by
        ``WhisperModel.transcribe``.
    """
    print(f"Loading model {model_size}...")
    whisper = WhisperModel(model_size)

    print(f"Transcribing {audio_path}...")
    # transcribe() yields a pair; only the first element is used here.
    segment_iter, _unused = whisper.transcribe(audio_path, language=language)

    # Materialize into a list so callers get a concrete sequence.
    return list(segment_iter)
|
||||
|
||||
if __name__ == "__main__":
    # At least one positional argument (the audio file path) is required.
    cli_args = sys.argv[1:]
    if not cli_args:
        print("Usage: python3 local_whisper.py <audio.wav>")
        sys.exit(1)

    # Print the text of every transcribed segment, one per line.
    for piece in transcribe_audio(cli_args[0]):
        print(piece.text)
|
||||
Loading…
Add table
Add a link
Reference in a new issue