Spaces:

Sambhavnoobcoder
/

PDF-text-extractor_sd_1

Runtime error

App Files Files Community

Sambhavnoobcoder committed on Jun 19, 2023

Commit

7917b4e

1 Parent(s): 33051d3

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -33

app.py CHANGED Viewed

@@ -21,47 +21,39 @@ def synthesize_audio(file, model_name_str, speaker_str):
 def main():
     logging.basicConfig(level=logging.INFO)
-    with gr.Interface(fn=None, title="PDF TO SPEECH CONVERTER", layout="rows", debug=True) as iface:
-        gr.Markdown(
-            """
-            <h1 align="center">PDF TO SPEECH CONVERTER</h1>
-            1. Insert a PDF
-            2. Select the model to synthesize with
-            3. Select speaker
-            4. Hit "Generate" and listen to the result!
-            When you select a model for the first time, it may take some time to download it.
-            This project is designed to bring the joy of reading without the hassle of looking over.
-            If you want an audiobook, you've got it!
-            """
-        )
-        file_input = gr.inputs.File(label="Upload PDF")
-        model_files = list_repo_files(repo_id="balacoon/tts")
-        model_name_dropdown = gr.inputs.Dropdown(label="Model", choices=model_files)
-        def set_model(model_name_str: str):
-            model_path = hf_hub_download(repo_id="balacoon/tts", filename=model_name_str)
-            global tts
-            tts = TTS(model_path)
-            speakers = tts.get_speakers()
-            default_speaker = speakers[-1]
-            return speakers, default_speaker
-        model_name_dropdown.set_action(set_model)
-        speaker_dropdown = gr.inputs.Dropdown(label="Speaker", choices=[])
-        audio = gr.outputs.Audio(label="Generated Audio", type="numpy")
-        def generate_audio(file, model_name_str, speaker_str):
-            return synthesize_audio(file, model_name_str, speaker_str)
-        iface.add_input(file_input)
-        iface.add_input(model_name_dropdown)
-        iface.add_input(speaker_dropdown)
-        iface.add_output(audio)
-        iface.run()
 if __name__ == "__main__":
     main()

 def main():
     logging.basicConfig(level=logging.INFO)
+    file_input = gr.inputs.File(label="Upload PDF")
+    model_files = list_repo_files(repo_id="balacoon/tts")
+    model_name_dropdown = gr.inputs.Dropdown(label="Model", choices=model_files)
+    def set_model(model_name_str: str):
+        model_path = hf_hub_download(repo_id="balacoon/tts", filename=model_name_str)
+        global tts
+        tts = TTS(model_path)
+        speakers = tts.get_speakers()
+        default_speaker = speakers[-1]
+        speaker_dropdown.choices = speakers
+        return speakers, default_speaker
+    speaker_dropdown = gr.inputs.Dropdown(label="Speaker", choices=[])
+    audio = gr.outputs.Audio(label="Generated Audio", type="numpy")
+    def generate_audio(file, model_name_str, speaker_str):
+        return synthesize_audio(file, model_name_str, speaker_str)
+    iface = gr.Interface(
+        fn=generate_audio,
+        inputs=[file_input, model_name_dropdown, speaker_dropdown],
+        outputs=audio,
+        title="PDF TO SPEECH CONVERTER",
+        layout="rows",
+        debug=True
+    )
+    model_name_dropdown.set_action(set_model)
+    iface.launch()
 if __name__ == "__main__":
     main()