hungchiayu committed on
Commit
297dc79
·
1 Parent(s): e7cbc76

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -15,6 +15,7 @@ from typing import Union
15
  from diffusers.utils.torch_utils import randn_tensor
16
  from tqdm import tqdm
17
  from TangoFlux import TangoFluxInference
 
18
 
19
 
20
 
@@ -44,7 +45,7 @@ Generate audio using Tango2 by providing a text prompt. Tango2 was built from Ta
44
  """
45
  # Gradio input and output components
46
  input_text = gr.Textbox(lines=2, label="Prompt")
47
- output_format = gr.Radio(label = "Output format", info = "The file you can dowload", choices = ["mp3", "wav"], value = "wav")
48
  output_audio = gr.Audio(label="Generated Audio", type="filepath")
49
  denoising_steps = gr.Slider(minimum=10, maximum=100, value=25, step=5, label="Steps", interactive=True)
50
  guidance_scale = gr.Slider(minimum=1, maximum=10, value=3, step=0.1, label="Guidance Scale", interactive=True)
@@ -53,7 +54,7 @@ duration_scale = gr.Slider(minimum=1, maximum=30, value=10, step=1, label="Durat
53
  # Gradio interface
54
  gr_interface = gr.Interface(
55
  fn=gradio_generate,
56
- inputs=[input_text, output_format, denoising_steps, guidance_scale,duration_scale],
57
  outputs=[output_audio],
58
  title="TangoFlux: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
59
  description=description_text,
 
15
  from diffusers.utils.torch_utils import randn_tensor
16
  from tqdm import tqdm
17
  from TangoFlux import TangoFluxInference
18
+ import torchaudio
19
 
20
 
21
 
 
45
  """
46
  # Gradio input and output components
47
  input_text = gr.Textbox(lines=2, label="Prompt")
48
+ #output_format = gr.Radio(label = "Output format", info = "The file you can dowload", choices = "wav"], value = "wav")
49
  output_audio = gr.Audio(label="Generated Audio", type="filepath")
50
  denoising_steps = gr.Slider(minimum=10, maximum=100, value=25, step=5, label="Steps", interactive=True)
51
  guidance_scale = gr.Slider(minimum=1, maximum=10, value=3, step=0.1, label="Guidance Scale", interactive=True)
 
54
  # Gradio interface
55
  gr_interface = gr.Interface(
56
  fn=gradio_generate,
57
+ inputs=[input_text, denoising_steps, guidance_scale,duration_scale],
58
  outputs=[output_audio],
59
  title="TangoFlux: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
60
  description=description_text,