Spaces:

ameerazam08
/

stableaudio-open-1.0

Running on Zero

App Files Files Community

ameerazam08 committed on Jun 5

Commit

35fe8b4

•

1 Parent(s): ccf495a

Update app.py

Browse files

Files changed (1) hide show

app.py +56 -1

app.py CHANGED Viewed

@@ -98,7 +98,62 @@ interface = gr.Interface(
     ],
     outputs=gr.Audio(type="filepath", label="Generated Audio"),
     title="Stable Audio Generator",
-    description="Generate variable-length stereo audio at 44.1kHz from text prompts using Stable Audio Open 1.0."
 )
 # Pre-load the model to avoid multiprocessing issues

     ],
     outputs=gr.Audio(type="filepath", label="Generated Audio"),
     title="Stable Audio Generator",
+    description="Generate variable-length stereo audio at 44.1kHz from text prompts using Stable Audio Open 1.0.",
+    examples=[
+    [
+        "Create a serene soundscape of a quiet beach at sunset.",  # Text prompt
+        "dpmpp-2m-sde",  # Sampler type
+        45,  # Duration in Seconds
+        100,  # Number of Diffusion Steps
+        10,  # CFG Scale
+        0.5,  # Sigma min
+        800  # Sigma max
+    ],
+    [
+        "Generate an energetic and bustling city street scene with distant traffic and close conversations.",  # Text prompt
+        "k-heun",  # Sampler type
+        30,  # Duration in Seconds
+        120,  # Number of Diffusion Steps
+        5,  # CFG Scale
+        0.2,  # Sigma min
+        600  # Sigma max
+    ],
+    [
+        "Simulate a forest ambiance with birds chirping and wind rustling through the leaves.",  # Text prompt
+        "k-dpm-fast",  # Sampler type
+        60,  # Duration in Seconds
+        140,  # Number of Diffusion Steps
+        7.5,  # CFG Scale
+        0.3,  # Sigma min
+        700  # Sigma max
+    ],
+    [
+        "Recreate a gentle rainfall with distant thunder.",  # Text prompt
+        "dpmpp-3m-sde",  # Sampler type
+        35,  # Duration in Seconds
+        110,  # Number of Diffusion Steps
+        8,  # CFG Scale
+        0.1,  # Sigma min
+        500  # Sigma max
+    ],
+    [
+        "Imagine a jazz cafe environment with soft music and ambient chatter.",  # Text prompt
+        "k-lms",  # Sampler type
+        25,  # Duration in Seconds
+        90,  # Number of Diffusion Steps
+        6,  # CFG Scale
+        0.4,  # Sigma min
+        650  # Sigma max
+    ],
+    ["Rock beat played in a treated studio, session drumming on an acoustic kit.",
+      "k-lms",  # Sampler type
+        25,  # Duration in Seconds
+        90,  # Number of Diffusion Steps
+        6,  # CFG Scale
+        0.3,  # Sigma min
+        500  # Sigma max
+    ]
+    ]
 )
 # Pre-load the model to avoid multiprocessing issues