Spaces:

OpenSound
/

SoloSpeech

Running on Zero

App Files Files Community

OpenSound committed 10 days ago

Commit

468a602

verified ·

1 Parent(s): 4d72af4

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -6

app.py CHANGED Viewed

@@ -264,27 +264,33 @@ css = """
 with gr.Blocks(css=css, theme=gr.themes.Soft()) as demo:
     with gr.Column(elem_id="col-container"):
         gr.Markdown("""
-            # 🎸 SoloSpeech: Enhancing Intelligibility and Quality in Target Speech Extraction through a Cascaded Generative Pipeline
             Extract the target voice from mixture speech given an enrollment speech.
-            Learn more about **SoloSpeech** on the [SoloSpeech Repo](https://github.com/WangHelin1997/SoloSpeech/).
         """)
         with gr.Tab("Target Speech Extraction"):
             with gr.Row():
                 mixture_input = gr.Audio(label="Upload Mixture Audio", type="filepath", value="test2.wav")
                 enroll_input = gr.Audio(label="Upload Enrollment Audio", type="filepath", value="test2_enroll.wav")
             with gr.Row():
                 demo_selector = gr.Dropdown(
                     label="Select Test Demo",
                     choices=[name for name, _, _ in demo_audio_files],
                     value="Test Demo 2"
                 )
-                extract_button = gr.Button("Extract", scale=1)
-            with gr.Row():
-                result = gr.Audio(label="Extracted Speech", type="numpy")
             # Update audio inputs when selecting from dropdown
             def update_audio_inputs(choice):

 with gr.Blocks(css=css, theme=gr.themes.Soft()) as demo:
     with gr.Column(elem_id="col-container"):
         gr.Markdown("""
+            # SoloSpeech: Enhancing Intelligibility and Quality in Target Speech Extraction through a Cascaded Generative Pipeline
             Extract the target voice from mixture speech given an enrollment speech.
+            Learn more about 🎯**SoloSpeech** on the [SoloSpeech Repo](https://github.com/WangHelin1997/SoloSpeech/).
+            Tip: To extract sound effects or music from audio, try using [SoloAudio](https://huggingface.co/spaces/OpenSound/SoloAudio).
         """)
         with gr.Tab("Target Speech Extraction"):
             with gr.Row():
                 mixture_input = gr.Audio(label="Upload Mixture Audio", type="filepath", value="test2.wav")
+            with gr.Row(equal_height=True):
                 enroll_input = gr.Audio(label="Upload Enrollment Audio", type="filepath", value="test2_enroll.wav")
+                extract_button = gr.Button("Extract", scale=1)
+                # extract_button = gr.Button("Extract", scale=1)
             with gr.Row():
+                result = gr.Audio(label="Extracted Speech", type="numpy")
+            with gr.Row(equal_height=True):
                 demo_selector = gr.Dropdown(
                     label="Select Test Demo",
                     choices=[name for name, _, _ in demo_audio_files],
                     value="Test Demo 2"
                 )
             # Update audio inputs when selecting from dropdown
             def update_audio_inputs(choice):