Spaces:
Runtime error
Runtime error
Commit
·
297dc79
1
Parent(s):
e7cbc76
Update app.py
Browse files
app.py
CHANGED
|
@@ -15,6 +15,7 @@ from typing import Union
|
|
| 15 |
from diffusers.utils.torch_utils import randn_tensor
|
| 16 |
from tqdm import tqdm
|
| 17 |
from TangoFlux import TangoFluxInference
|
|
|
|
| 18 |
|
| 19 |
|
| 20 |
|
|
@@ -44,7 +45,7 @@ Generate audio using Tango2 by providing a text prompt. Tango2 was built from Ta
|
|
| 44 |
"""
|
| 45 |
# Gradio input and output components
|
| 46 |
input_text = gr.Textbox(lines=2, label="Prompt")
|
| 47 |
-
output_format = gr.Radio(label = "Output format", info = "The file you can dowload", choices =
|
| 48 |
output_audio = gr.Audio(label="Generated Audio", type="filepath")
|
| 49 |
denoising_steps = gr.Slider(minimum=10, maximum=100, value=25, step=5, label="Steps", interactive=True)
|
| 50 |
guidance_scale = gr.Slider(minimum=1, maximum=10, value=3, step=0.1, label="Guidance Scale", interactive=True)
|
|
@@ -53,7 +54,7 @@ duration_scale = gr.Slider(minimum=1, maximum=30, value=10, step=1, label="Durat
|
|
| 53 |
# Gradio interface
|
| 54 |
gr_interface = gr.Interface(
|
| 55 |
fn=gradio_generate,
|
| 56 |
-
inputs=[input_text,
|
| 57 |
outputs=[output_audio],
|
| 58 |
title="TangoFlux: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
|
| 59 |
description=description_text,
|
|
|
|
| 15 |
from diffusers.utils.torch_utils import randn_tensor
|
| 16 |
from tqdm import tqdm
|
| 17 |
from TangoFlux import TangoFluxInference
|
| 18 |
+
import torchaudio
|
| 19 |
|
| 20 |
|
| 21 |
|
|
|
|
| 45 |
"""
|
| 46 |
# Gradio input and output components
|
| 47 |
input_text = gr.Textbox(lines=2, label="Prompt")
|
| 48 |
+
#output_format = gr.Radio(label = "Output format", info = "The file you can dowload", choices = ["wav"], value = "wav")
|
| 49 |
output_audio = gr.Audio(label="Generated Audio", type="filepath")
|
| 50 |
denoising_steps = gr.Slider(minimum=10, maximum=100, value=25, step=5, label="Steps", interactive=True)
|
| 51 |
guidance_scale = gr.Slider(minimum=1, maximum=10, value=3, step=0.1, label="Guidance Scale", interactive=True)
|
|
|
|
| 54 |
# Gradio interface
|
| 55 |
gr_interface = gr.Interface(
|
| 56 |
fn=gradio_generate,
|
| 57 |
+
inputs=[input_text, denoising_steps, guidance_scale,duration_scale],
|
| 58 |
outputs=[output_audio],
|
| 59 |
title="TangoFlux: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
|
| 60 |
description=description_text,
|