Python Usage¶
Transcribe audio¶
from pathlib import Path
from whisper_smith.exporters import export_transcript
from whisper_smith.transcribe import transcribe_audio
result = transcribe_audio(Path("data/sample.m4a"))
print(result.text)
srt = export_transcript(result, "srt")
Path("data/sample.srt").write_text(srt, encoding="utf-8")
Diarize audio¶
from pathlib import Path
from whisper_smith.diarize import diarize_audio
result = diarize_audio(Path("data/sample.m4a"))
for segment in result.segments:
print(segment.start, segment.end, segment.speaker)
Assign speakers¶
from whisper_smith.align import assign_speakers
aligned = assign_speakers(transcript, diarization)
Export JSON¶
from pathlib import Path
from whisper_smith.exporters import export_json
Path("data/sample.aligned.json").write_text(
export_json(aligned),
encoding="utf-8",
)