Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -86,17 +86,20 @@ def generate_audio(prompt, seconds_total=10, steps=100, cfg_scale=7):
|
|
86 |
return unique_filename
|
87 |
|
88 |
# Setting up the Gradio Interface
|
|
|
|
|
89 |
interface = gr.Interface(
|
90 |
fn=generate_audio,
|
91 |
inputs=[
|
92 |
gr.Textbox(label="Prompt", placeholder="Enter your text prompt here"),
|
93 |
gr.Slider(0, 10, value=5, label="Duration in Seconds"),
|
94 |
-
gr.Slider(10,
|
95 |
gr.Slider(1, 10, value=7, step=0.1, label="CFG Scale")
|
96 |
],
|
97 |
outputs=gr.Audio(type="filepath", label="Generated Audio"),
|
98 |
title="Synthio Stable Audio Generator",
|
99 |
-
description="
|
|
|
100 |
|
101 |
# Launch the Interface
|
102 |
interface.launch()
|
|
|
86 |
return unique_filename
|
87 |
|
88 |
# Setting up the Gradio Interface
|
89 |
+
paper_link = "https://arxiv.org/pdf/2410.02056"
|
90 |
+
paper_text = "Synthio: Augmenting Small-Scale Audio Classification Datasets with Synthetic Data"
|
91 |
interface = gr.Interface(
|
92 |
fn=generate_audio,
|
93 |
inputs=[
|
94 |
gr.Textbox(label="Prompt", placeholder="Enter your text prompt here"),
|
95 |
gr.Slider(0, 10, value=5, label="Duration in Seconds"),
|
96 |
+
gr.Slider(10, 250, value=150, step=10, label="Number of Diffusion Steps"),
|
97 |
gr.Slider(1, 10, value=7, step=0.1, label="CFG Scale")
|
98 |
],
|
99 |
outputs=gr.Audio(type="filepath", label="Generated Audio"),
|
100 |
title="Synthio Stable Audio Generator",
|
101 |
+
description="A text-to-audio diffusion model (based on the Stable Audio DiT architecture) for generating variable length synthetic audios from text prompts at 44.1kHz.<br>"+
|
102 |
+
"This model was developed as part of the paper: " + f"<a href='{paper_link}'>{paper_text}</a> <br>")
|
103 |
|
104 |
# Launch the Interface
|
105 |
interface.launch()
|