asr-inference

Running on Zero

ssolito committed 7 days ago

Commit

790d7cc

verified ·

1 Parent(s): 24a2822

Update whisper.py (#14)

- Update whisper.py (beabd7ce92d057ea91e8993afddf9e989f891719)

Co-authored-by: Sarah Solito <ssolito@users.noreply.huggingface.co>

Files changed (1) hide show

whisper.py CHANGED Viewed

@@ -134,6 +134,8 @@ def generate(audio_path, use_v2):
         output = ""
         for start, end, speaker, text in merged_transcript:
             output += f"[{speaker}]: {text}\n"
     else:
         audio = AudioSegment.from_wav(audio_path)
@@ -144,8 +146,7 @@ def generate(audio_path, use_v2):
             audio.export(temp_mono_path, format="wav")
             audio_path = temp_mono_path
         output = transcribe_pipeline(format_audio(audio_path), task)
-    clean_output = post_process_transcription(output, max_repeats=1) #check
     if temp_mono_path and os.path.exists(temp_mono_path):
         os.remove(temp_mono_path)

         output = ""
         for start, end, speaker, text in merged_transcript:
             output += f"[{speaker}]: {text}\n"
+        clean_output = output.strip()
     else:
         audio = AudioSegment.from_wav(audio_path)
             audio.export(temp_mono_path, format="wav")
             audio_path = temp_mono_path
         output = transcribe_pipeline(format_audio(audio_path), task)
+        clean_output = post_process_transcription(output)
     if temp_mono_path and os.path.exists(temp_mono_path):
         os.remove(temp_mono_path)