Spaces:
Running
Running
modify app
Browse files
app.py
CHANGED
@@ -156,23 +156,23 @@ def update_ito_output(all_results, selected_step):
|
|
156 |
with gr.Blocks() as demo:
|
157 |
gr.Markdown("# ITO-Master: Inference Time Optimization for Mastering Style Transfer")
|
158 |
with gr.Row():
|
159 |
-
gr.Markdown("
|
160 |
The mastering style transfer is performed by a differentiable audio processing model, and the predicted parameters are shown as the output. \
|
161 |
-
Perform mastering style transfer with an input source audio and a reference mastering style audio. On top of this result, you can perform ITO to optimize the reference embedding
|
162 |
-
gr.Image("ito_snow.png", width=
|
163 |
|
164 |
-
gr.Markdown("
|
165 |
|
166 |
with gr.Tab("Upload Audio"):
|
167 |
with gr.Row():
|
168 |
-
input_audio = gr.Audio(label=
|
169 |
-
reference_audio = gr.Audio(label="Reference Style Audio (
|
170 |
|
171 |
process_button = gr.Button("Process Mastering Style Transfer")
|
172 |
|
173 |
with gr.Row():
|
174 |
with gr.Column():
|
175 |
-
output_audio = gr.Audio(label="Output Audio (
|
176 |
normalized_input = gr.Audio(label="Normalized Source Audio", type='numpy')
|
177 |
param_output = gr.Textbox(label="Predicted Parameters", lines=5)
|
178 |
|
|
|
156 |
with gr.Blocks() as demo:
|
157 |
gr.Markdown("# ITO-Master: Inference Time Optimization for Mastering Style Transfer")
|
158 |
with gr.Row():
|
159 |
+
gr.Markdown("Interactive demo of Inference Time Optimization (ITO) for Music Mastering Style Transfer. \
|
160 |
The mastering style transfer is performed by a differentiable audio processing model, and the predicted parameters are shown as the output. \
|
161 |
+
Perform mastering style transfer with an input source audio and a reference mastering style audio. On top of this result, you can perform ITO to optimize the reference embedding z~ref~ $z_{ref}$ to further gain control over the output mastering style.")
|
162 |
+
gr.Image("ito_snow.png", width=300)
|
163 |
|
164 |
+
gr.Markdown("## Step 1: Mastering Style Transfer")
|
165 |
|
166 |
with gr.Tab("Upload Audio"):
|
167 |
with gr.Row():
|
168 |
+
input_audio = gr.Audio(label="Source Audio (x~in~ $x_{in}$)")
|
169 |
+
reference_audio = gr.Audio(label="Reference Style Audio (x~ref~ $x_{ref}$)")
|
170 |
|
171 |
process_button = gr.Button("Process Mastering Style Transfer")
|
172 |
|
173 |
with gr.Row():
|
174 |
with gr.Column():
|
175 |
+
output_audio = gr.Audio(label="Output Audio (y')", type='numpy')
|
176 |
normalized_input = gr.Audio(label="Normalized Source Audio", type='numpy')
|
177 |
param_output = gr.Textbox(label="Predicted Parameters", lines=5)
|
178 |
|