Spaces:

Luigi
/

Whisper-vs-Sensevoice-Small

Running on Zero

Luigi committed on Jun 3

Commit

0ae11fc

1 Parent(s): c680485

improve exception handling on sensevoice branch

Files changed (1) hide show

app.py CHANGED Viewed

@@ -279,6 +279,7 @@ def _transcribe_sense_gpu_stream(model_id: str, language: str, audio_path: str,
         diary = diarizer({"waveform": waveform, "sample_rate": sample_rate}, hook=hook)
     snippets = []
     cache = {}
     for turn, _, speaker in diary.itertracks(yield_label=True):
         start_ms, end_ms = int(turn.start*1000), int(turn.end*1000)
         segment = AudioSegment.from_file(audio_path)[start_ms:end_ms]
@@ -290,11 +291,12 @@ def _transcribe_sense_gpu_stream(model_id: str, language: str, audio_path: str,
             except Exception as e:
                 cprint(f'Error: {e}','red')
         os.unlink(tmp.name)
-        txt = rich_transcription_postprocess(segs[0]['text'])
-        if not enable_punct:
-            txt = re.sub(r"[^\w\s]", "", txt)
-        txt = converter.convert(txt)
-        snippets.append(f"[{speaker}] {txt}")
         yield "", format_diarization_html(snippets)
     return

         diary = diarizer({"waveform": waveform, "sample_rate": sample_rate}, hook=hook)
     snippets = []
     cache = {}
+    segs = None
     for turn, _, speaker in diary.itertracks(yield_label=True):
         start_ms, end_ms = int(turn.start*1000), int(turn.end*1000)
         segment = AudioSegment.from_file(audio_path)[start_ms:end_ms]
             except Exception as e:
                 cprint(f'Error: {e}','red')
         os.unlink(tmp.name)
+        if segs:
+            txt = rich_transcription_postprocess(segs[0]['text'])
+            if not enable_punct:
+                txt = re.sub(r"[^\w\s]", "", txt)
+            txt = converter.convert(txt)
+            snippets.append(f"[{speaker}] {txt}")
         yield "", format_diarization_html(snippets)
     return