sonalkum committed on
Commit
46f753f
·
verified ·
1 Parent(s): e8d4978

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -86,17 +86,20 @@ def generate_audio(prompt, seconds_total=10, steps=100, cfg_scale=7):
86
  return unique_filename
87
 
88
  # Setting up the Gradio Interface
 
 
89
  interface = gr.Interface(
90
  fn=generate_audio,
91
  inputs=[
92
  gr.Textbox(label="Prompt", placeholder="Enter your text prompt here"),
93
  gr.Slider(0, 10, value=5, label="Duration in Seconds"),
94
- gr.Slider(10, 150, value=100, step=10, label="Number of Diffusion Steps"),
95
  gr.Slider(1, 10, value=7, step=0.1, label="CFG Scale")
96
  ],
97
  outputs=gr.Audio(type="filepath", label="Generated Audio"),
98
  title="Synthio Stable Audio Generator",
99
- description="Generate variable-length stereo audio at 44.1kHz from text prompts using Synthio's Stable Audio Open 1.0.")
 
100
 
101
  # Launch the Interface
102
  interface.launch()
 
86
  return unique_filename
87
 
88
  # Setting up the Gradio Interface
89
+ paper_link = "https://arxiv.org/pdf/2410.02056"
90
+ paper_text = "Synthio: Augmenting Small-Scale Audio Classification Datasets with Synthetic Data"
91
  interface = gr.Interface(
92
  fn=generate_audio,
93
  inputs=[
94
  gr.Textbox(label="Prompt", placeholder="Enter your text prompt here"),
95
  gr.Slider(0, 10, value=5, label="Duration in Seconds"),
96
+ gr.Slider(10, 250, value=150, step=10, label="Number of Diffusion Steps"),
97
  gr.Slider(1, 10, value=7, step=0.1, label="CFG Scale")
98
  ],
99
  outputs=gr.Audio(type="filepath", label="Generated Audio"),
100
  title="Synthio Stable Audio Generator",
101
+ description="A text-to-audio diffusion model (based on the Stable Audio DiT architecture) for generating variable length synthetic audios from text prompts at 44.1kHz.<br>"+
102
+ "This model was developed as part of the paper: " + f"<a href='{paper_link}'>{paper_text}</a> <br>")
103
 
104
  # Launch the Interface
105
  interface.launch()