DeeeeeeM
committed on
Commit
·
5899607
1
Parent(s):
77b6231
Added fixes for SRT output
Browse files
- .gitignore +2 -1
- app.py +8 -2
.gitignore
CHANGED
@@ -1 +1,2 @@
|
|
1 |
-
.gradio/
|
|
|
|
1 |
+
.gradio/
|
2 |
+
.vscode/
|
app.py
CHANGED
@@ -25,12 +25,12 @@ def process_media(
|
|
25 |
if model_type == "faster whisper":
|
26 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
27 |
model = stable_whisper.load_faster_whisper(model_size, device=device)
|
28 |
-
result = model.transcribe(temp_path, language=source_lang, vad=True, regroup=False,
|
29 |
else:
|
30 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
31 |
model = stable_whisper.load_model(model_size, device=device)
|
32 |
result = model.transcribe(temp_path, language=source_lang, vad=True, regroup=False, no_speech_threshold=0.9, denoiser="demucs")
|
33 |
-
#, batch_size=16
|
34 |
#result.save_as_json(word_transcription_path)
|
35 |
|
36 |
# ADVANCED SETTINGS #
|
@@ -131,6 +131,12 @@ def optimize_text(text, max_lines_per_segment, line_penalty, longest_line_char_p
|
|
131 |
|
132 |
backtrack(0, 0, 0, [])
|
133 |
|
|
|
|
|
|
|
|
|
|
|
|
|
134 |
optimized = '\n'.join(' '.join(words) for words in bestSplit)
|
135 |
return optimized
|
136 |
|
|
|
25 |
if model_type == "faster whisper":
|
26 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
27 |
model = stable_whisper.load_faster_whisper(model_size, device=device)
|
28 |
+
result = model.transcribe(temp_path, language=source_lang, vad=True, regroup=False,no_speech_threshold=0.9)
|
29 |
else:
|
30 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
31 |
model = stable_whisper.load_model(model_size, device=device)
|
32 |
result = model.transcribe(temp_path, language=source_lang, vad=True, regroup=False, no_speech_threshold=0.9, denoiser="demucs")
|
33 |
+
#, batch_size=16, denoiser="demucs"
|
34 |
#result.save_as_json(word_transcription_path)
|
35 |
|
36 |
# ADVANCED SETTINGS #
|
|
|
131 |
|
132 |
backtrack(0, 0, 0, [])
|
133 |
|
134 |
+
if not bestSplit:
|
135 |
+
return text
|
136 |
+
|
137 |
+
if len(bestSplit) > max_lines_per_segment or any(len(line) == 1 for line in bestSplit):
|
138 |
+
return text
|
139 |
+
|
140 |
optimized = '\n'.join(' '.join(words) for words in bestSplit)
|
141 |
return optimized
|
142 |
|