sam-audio-webui

Runtime error

App Files Files Community

Peter Shi committed 8 days ago

Commit

3cc9650

1 Parent(s): a11009d

Simplify UI - remove tabs, fix example buttons

Browse files

Files changed (1) hide show

app.py +20 -31

app.py CHANGED Viewed

@@ -29,13 +29,11 @@ current_model_name = None
 model = None
 processor = None
-def load_model(model_name, progress=None):
     global current_model_name, model, processor
     model_id = MODELS.get(model_name, MODELS[DEFAULT_MODEL])
     if current_model_name == model_name and model is not None:
         return
-    if progress:
-        progress(0.1, desc="Loading model...")
     print(f"Loading {model_id}...")
     model = SAMAudio.from_pretrained(model_id).to(device).eval()
     processor = SAMAudioProcessor.from_pretrained(model_id)
@@ -83,16 +81,6 @@ def separate_audio(model_name, file_path, text_prompt, progress=gr.Progress()):
         traceback.print_exc()
         return None, None, f"❌ Error: {str(e)}"
-def process_audio(model_name, audio_path, prompt, progress=gr.Progress()):
-    if not audio_path:
-        return None, None, "❌ Please upload an audio file."
-    return separate_audio(model_name, audio_path, prompt, progress)
-def process_video(model_name, video_path, prompt, progress=gr.Progress()):
-    if not video_path:
-        return None, None, "❌ Please upload a video file."
-    return separate_audio(model_name, video_path, prompt, progress)
 # Build Interface
 with gr.Blocks(title="SAM-Audio Demo") as demo:
     gr.Markdown(
@@ -110,12 +98,11 @@ with gr.Blocks(title="SAM-Audio Demo") as demo:
                 label="Model"
             )
-            tabs = gr.Tabs()
-            with tabs:
-                with gr.TabItem("🎵 Audio", id=0):
-                    input_audio = gr.Audio(label="Upload Audio", type="filepath")
-                with gr.TabItem("🎬 Video", id=1):
-                    input_video = gr.Video(label="Upload Video")
             text_prompt = gr.Textbox(
                 label="Text Prompt",
@@ -132,7 +119,7 @@ with gr.Blocks(title="SAM-Audio Demo") as demo:
     gr.Markdown("---")
     gr.Markdown("### 🎬 Demo Examples")
-    gr.Markdown("Click to load example, then click 'Isolate Sound' to process:")
     with gr.Row():
         if os.path.exists(EXAMPLE_FILE):
@@ -140,28 +127,30 @@ with gr.Blocks(title="SAM-Audio Demo") as demo:
             example_btn2 = gr.Button("🎤 Woman Speaking")
             example_btn3 = gr.Button("🎵 Background Music")
-    # Main process button - check which tab has content
     run_btn.click(
-        fn=lambda m, a, v, p: process_audio(m, a, p) if a else process_video(m, v, p),
         inputs=[model_selector, input_audio, input_video, text_prompt],
         outputs=[output_target, output_residual, status_output]
     )
-    # Example buttons - only fill in data, switch to video tab
     if os.path.exists(EXAMPLE_FILE):
         example_btn1.click(
-            fn=lambda: (EXAMPLE_FILE, "A man speaking", gr.Tabs(selected=1)),
-            outputs=[input_video, text_prompt, tabs]
         )
         example_btn2.click(
-            fn=lambda: (EXAMPLE_FILE, "A woman speaking", gr.Tabs(selected=1)),
-            outputs=[input_video, text_prompt, tabs]
         )
         example_btn3.click(
-            fn=lambda: (EXAMPLE_FILE, "Background music", gr.Tabs(selected=1)),
-            outputs=[input_video, text_prompt, tabs]
         )
 if __name__ == "__main__":

 model = None
 processor = None
+def load_model(model_name):
     global current_model_name, model, processor
     model_id = MODELS.get(model_name, MODELS[DEFAULT_MODEL])
     if current_model_name == model_name and model is not None:
         return
     print(f"Loading {model_id}...")
     model = SAMAudio.from_pretrained(model_id).to(device).eval()
     processor = SAMAudioProcessor.from_pretrained(model_id)
         traceback.print_exc()
         return None, None, f"❌ Error: {str(e)}"
 # Build Interface
 with gr.Blocks(title="SAM-Audio Demo") as demo:
     gr.Markdown(
                 label="Model"
             )
+            gr.Markdown("#### Upload Audio")
+            input_audio = gr.Audio(label="Audio File", type="filepath")
+            gr.Markdown("#### Or Upload Video")
+            input_video = gr.Video(label="Video File")
             text_prompt = gr.Textbox(
                 label="Text Prompt",
     gr.Markdown("---")
     gr.Markdown("### 🎬 Demo Examples")
+    gr.Markdown("Click to load example video and prompt:")
     with gr.Row():
         if os.path.exists(EXAMPLE_FILE):
             example_btn2 = gr.Button("🎤 Woman Speaking")
             example_btn3 = gr.Button("🎵 Background Music")
+    # Main process button
+    def process(model_name, audio_path, video_path, prompt, progress=gr.Progress()):
+        file_path = video_path if video_path else audio_path
+        return separate_audio(model_name, file_path, prompt, progress)
     run_btn.click(
+        fn=process,
         inputs=[model_selector, input_audio, input_video, text_prompt],
         outputs=[output_target, output_residual, status_output]
     )
+    # Example buttons - fill in the example video and prompt only; the user then clicks the run button to process
     if os.path.exists(EXAMPLE_FILE):
         example_btn1.click(
+            fn=lambda: (EXAMPLE_FILE, "A man speaking"),
+            outputs=[input_video, text_prompt]
         )
         example_btn2.click(
+            fn=lambda: (EXAMPLE_FILE, "A woman speaking"),
+            outputs=[input_video, text_prompt]
         )
         example_btn3.click(
+            fn=lambda: (EXAMPLE_FILE, "Background music"),
+            outputs=[input_video, text_prompt]
         )
 if __name__ == "__main__":