Spaces:

yonigozlan
/

Segment-Anything-2-video-tracking

Running on Zero

App Files Community

yonigozlan HF Staff committed on Aug 12

Commit

41c6ac5

1 Parent(s): 02f1528

update

Browse files

Files changed (1) hide show

app.py +6 -9

app.py CHANGED Viewed

@@ -5,7 +5,6 @@ from typing import Optional
 import gradio as gr
 import numpy as np
 import torch
-from gradio.themes import Soft
 from PIL import Image, ImageDraw
 # Prefer local transformers in the workspace
@@ -233,6 +232,8 @@ def ensure_session_for_current_model() -> None:
             GLOBAL_STATE.inference_session = processor.init_video_session(
                 video=GLOBAL_STATE.video_frames,
                 inference_device=device,
             )
             GLOBAL_STATE.session_repo_id = desired_repo
@@ -277,6 +278,7 @@ def init_video_session(video: str | dict) -> tuple[AppState, int, int, Image.Ima
         video=frames,
         inference_device=device,
         video_storage_device="cpu",
     )
     GLOBAL_STATE.inference_session = inference_session
@@ -482,7 +484,7 @@ def on_image_click(
     return update_frame_display(GLOBAL_STATE, int(frame_idx))
-def propagate_masks(state: AppState, progress=gr.Progress()):
     if state is None or state.inference_session is None:
         yield "Load a video first."
         return
@@ -494,7 +496,6 @@ def propagate_masks(state: AppState, progress=gr.Progress()):
     total = max(1, GLOBAL_STATE.num_frames)
     processed = 0
-    # Initial status for first run visibility
     yield f"Propagating masks: {processed}/{total}"
     device_type = "cuda" if GLOBAL_STATE.device == "cuda" else "cpu"
@@ -516,8 +517,6 @@ def propagate_masks(state: AppState, progress=gr.Progress()):
             GLOBAL_STATE.composited_frames.pop(frame_idx, None)
             processed += 1
-            progress((processed, total), f"Propagating masks: {processed}/{total}")
-            # Stream status updates so users see progress text
             yield f"Propagating masks: {processed}/{total}"
     yield f"Propagated masks across {processed} frames for {len(inference_session.obj_ids)} objects."
@@ -563,9 +562,7 @@ def reset_session() -> tuple[AppState, Image.Image, int, int, str]:
     return GLOBAL_STATE, preview_img, slider_minmax, slider_value, status
-theme = Soft(primary_hue="indigo", secondary_hue="rose", neutral_hue="slate")
-with gr.Blocks(title="SAM2 Video (Transformers) - Interactive Segmentation", theme=theme) as demo:
     state = gr.State(GLOBAL_STATE)
     gr.Markdown("""
@@ -743,7 +740,7 @@ with gr.Blocks(title="SAM2 Video (Transformers) - Interactive Segmentation", the
     render_btn.click(_render_video, inputs=[state], outputs=[playback_video])
-    propagate_btn.click(propagate_masks, inputs=[state], outputs=[propagate_status], show_progress=True)
     reset_btn.click(
         reset_session,

 import gradio as gr
 import numpy as np
 import torch
 from PIL import Image, ImageDraw
 # Prefer local transformers in the workspace
             GLOBAL_STATE.inference_session = processor.init_video_session(
                 video=GLOBAL_STATE.video_frames,
                 inference_device=device,
+                video_storage_device="cpu",
+                torch_dtype=dtype,
             )
             GLOBAL_STATE.session_repo_id = desired_repo
         video=frames,
         inference_device=device,
         video_storage_device="cpu",
+        torch_dtype=dtype,
     )
     GLOBAL_STATE.inference_session = inference_session
     return update_frame_display(GLOBAL_STATE, int(frame_idx))
+def propagate_masks(state: AppState):
     if state is None or state.inference_session is None:
         yield "Load a video first."
         return
     total = max(1, GLOBAL_STATE.num_frames)
     processed = 0
     yield f"Propagating masks: {processed}/{total}"
     device_type = "cuda" if GLOBAL_STATE.device == "cuda" else "cpu"
             GLOBAL_STATE.composited_frames.pop(frame_idx, None)
             processed += 1
             yield f"Propagating masks: {processed}/{total}"
     yield f"Propagated masks across {processed} frames for {len(inference_session.obj_ids)} objects."
     return GLOBAL_STATE, preview_img, slider_minmax, slider_value, status
+with gr.Blocks(title="SAM2 Video (Transformers) - Interactive Segmentation", theme="shivi/calm_seafoam") as demo:
     state = gr.State(GLOBAL_STATE)
     gr.Markdown("""
     render_btn.click(_render_video, inputs=[state], outputs=[playback_video])
+    propagate_btn.click(propagate_masks, inputs=[state], outputs=[propagate_status])
     reset_btn.click(
         reset_session,