Spaces:
Running
on
Zero
Running
on
Zero
Commit
·
297dc79
1
Parent(s):
e7cbc76
Update app.py
Browse files
app.py
CHANGED
@@ -15,6 +15,7 @@ from typing import Union
|
|
15 |
from diffusers.utils.torch_utils import randn_tensor
|
16 |
from tqdm import tqdm
|
17 |
from TangoFlux import TangoFluxInference
|
|
|
18 |
|
19 |
|
20 |
|
@@ -44,7 +45,7 @@ Generate audio using Tango2 by providing a text prompt. Tango2 was built from Ta
|
|
44 |
"""
|
45 |
# Gradio input and output components
|
46 |
input_text = gr.Textbox(lines=2, label="Prompt")
|
47 |
-
output_format = gr.Radio(label = "Output format", info = "The file you can dowload", choices =
|
48 |
output_audio = gr.Audio(label="Generated Audio", type="filepath")
|
49 |
denoising_steps = gr.Slider(minimum=10, maximum=100, value=25, step=5, label="Steps", interactive=True)
|
50 |
guidance_scale = gr.Slider(minimum=1, maximum=10, value=3, step=0.1, label="Guidance Scale", interactive=True)
|
@@ -53,7 +54,7 @@ duration_scale = gr.Slider(minimum=1, maximum=30, value=10, step=1, label="Durat
|
|
53 |
# Gradio interface
|
54 |
gr_interface = gr.Interface(
|
55 |
fn=gradio_generate,
|
56 |
-
inputs=[input_text,
|
57 |
outputs=[output_audio],
|
58 |
title="TangoFlux: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
|
59 |
description=description_text,
|
|
|
15 |
from diffusers.utils.torch_utils import randn_tensor
|
16 |
from tqdm import tqdm
|
17 |
from TangoFlux import TangoFluxInference
|
18 |
+
import torchaudio
|
19 |
|
20 |
|
21 |
|
|
|
45 |
"""
|
46 |
# Gradio input and output components
|
47 |
input_text = gr.Textbox(lines=2, label="Prompt")
|
48 |
+
#output_format = gr.Radio(label = "Output format", info = "The file you can dowload", choices = "wav"], value = "wav")
|
49 |
output_audio = gr.Audio(label="Generated Audio", type="filepath")
|
50 |
denoising_steps = gr.Slider(minimum=10, maximum=100, value=25, step=5, label="Steps", interactive=True)
|
51 |
guidance_scale = gr.Slider(minimum=1, maximum=10, value=3, step=0.1, label="Guidance Scale", interactive=True)
|
|
|
54 |
# Gradio interface
|
55 |
gr_interface = gr.Interface(
|
56 |
fn=gradio_generate,
|
57 |
+
inputs=[input_text, denoising_steps, guidance_scale,duration_scale],
|
58 |
outputs=[output_audio],
|
59 |
title="TangoFlux: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
|
60 |
description=description_text,
|