Spaces:
Runtime error
Commit
•
8436e2d
1
Parent(s):
b725215
added examples (#5)
Browse files
- added examples (a9489b3016ac777b7bdcdc76141a19ac4c17c882)
Co-authored-by: Ameer Azam <[email protected]>
app.py
CHANGED
@@ -93,7 +93,49 @@ interface = gr.Interface(
|
|
93 |
],
|
94 |
outputs=gr.Audio(type="filepath", label="Generated Audio"),
|
95 |
title="Stable Audio Generator",
|
96 |
-
description="Generate variable-length stereo audio at 44.1kHz from text prompts using Stable Audio Open 1.0."
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
97 |
)
|
98 |
|
99 |
# Pre-load the model to avoid multiprocessing issues
|
|
|
93 |
],
|
94 |
outputs=gr.Audio(type="filepath", label="Generated Audio"),
|
95 |
title="Stable Audio Generator",
|
96 |
+
description="Generate variable-length stereo audio at 44.1kHz from text prompts using Stable Audio Open 1.0.",
|
97 |
+
examples=[
|
98 |
+
[
|
99 |
+
"Create a serene soundscape of a quiet beach at sunset.", # Text prompt
|
100 |
+
|
101 |
+
45, # Duration in Seconds
|
102 |
+
100, # Number of Diffusion Steps
|
103 |
+
10, # CFG Scale
|
104 |
+
],
|
105 |
+
[
|
106 |
+
"Generate an energetic and bustling city street scene with distant traffic and close conversations.", # Text prompt
|
107 |
+
|
108 |
+
30, # Duration in Seconds
|
109 |
+
120, # Number of Diffusion Steps
|
110 |
+
5, # CFG Scale
|
111 |
+
],
|
112 |
+
[
|
113 |
+
"Simulate a forest ambiance with birds chirping and wind rustling through the leaves.", # Text prompt
|
114 |
+
60, # Duration in Seconds
|
115 |
+
140, # Number of Diffusion Steps
|
116 |
+
7.5, # CFG Scale
|
117 |
+
],
|
118 |
+
[
|
119 |
+
"Recreate a gentle rainfall with distant thunder.", # Text prompt
|
120 |
+
|
121 |
+
35, # Duration in Seconds
|
122 |
+
110, # Number of Diffusion Steps
|
123 |
+
8, # CFG Scale
|
124 |
+
|
125 |
+
],
|
126 |
+
[
|
127 |
+
"Imagine a jazz cafe environment with soft music and ambient chatter.", # Text prompt
|
128 |
+
25, # Duration in Seconds
|
129 |
+
90, # Number of Diffusion Steps
|
130 |
+
6, # CFG Scale
|
131 |
+
|
132 |
+
],
|
133 |
+
["Rock beat played in a treated studio, session drumming on an acoustic kit.",
|
134 |
+
30, # Duration in Seconds
|
135 |
+
100, # Number of Diffusion Steps
|
136 |
+
7, # CFG Scale
|
137 |
+
|
138 |
+
]
|
139 |
)
|
140 |
|
141 |
# Pre-load the model to avoid multiprocessing issues
|