Fix number bug in WhisperX alignment: run replace_numbers_with_words on the text before aligning

2025-06-05 21:49:11 +02:00 · 2024-04-25 14:38:03 -05:00
parent 4a3a8f11a7
commit fd20265324
1 changed file with 3 additions and 1 deletion
--- a/gradio_app.py
+++ b/gradio_app.py
@@ -74,6 +74,8 @@ class WhisperxModel:

    def transcribe(self, audio_path):
        segments = self.model.transcribe(audio_path, batch_size=8)["segments"]
+        for segment in segments:
+            segment['text'] = replace_numbers_with_words(segment['text'])
        return self.align_model.align(segments, audio_path)


@@ -177,7 +179,7 @@ def align(seed, transcript, audio_path):
    if align_model is None:
        raise gr.Error("Align model not loaded")
    seed_everything(seed)
-
+    transcript = replace_numbers_with_words(transcript).replace("  ", " ").replace("  ", " ")
    fragments = align_segments(transcript, audio_path)
    segments = [{
        "start": float(fragment["begin"]),