Spaces:

hadiyya
/

MC1-Gradio-Assignment

Runtime error

App Files Files Community

hadiyya commited on May 5

Commit

fccb324

verified ·

1 Parent(s): 98d6c17

Define stream_object_detection

Browse files

Files changed (1) hide show

app.py +75 -3

app.py CHANGED Viewed

@@ -1,3 +1,77 @@
 import gradio as gr
 with gr.Blocks() as app:
@@ -20,11 +94,9 @@ with gr.Blocks() as app:
         with gr.Column():
             output_video = gr.Video(label="Processed Video", streaming=True, autoplay=True)
-    video.upload(
         fn=stream_object_detection,
         inputs=[video, conf_threshold],
         outputs=[output_video],
     )
-    # This is from: https://www.gradio.app/guides/object-detection-from-video

+import spaces
+import cv2
+from PIL import Image
+import torch
+import time
+import numpy as np
+import uuid
+from draw_boxes import draw_bounding_boxes
+from transformers import AutoImageProcessor, AutoModelForObjectDetection  # Added import
+SUBSAMPLE = 2
+# Initialize image processor and model
+image_processor = AutoImageProcessor.from_pretrained("PekingU/rtdetr_r101vd_coco_o365")
+model = AutoModelForObjectDetection.from_pretrained("PekingU/rtdetr_r101vd_coco_o365").to("cuda")
+@spaces.GPU
+def stream_object_detection(video, conf_threshold):
+    cap = cv2.VideoCapture(video)
+    video_codec = cv2.VideoWriter_fourcc(*"mp4v") # type: ignore
+    fps = int(cap.get(cv2.CAP_PROP_FPS))
+    desired_fps = fps // SUBSAMPLE
+    width  = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)) // 2
+    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT)) // 2
+    iterating, frame = cap.read()
+    n_frames = 0
+    output_video_name = f"output_{uuid.uuid4()}.mp4"
+    # Output Video
+    output_video = cv2.VideoWriter(output_video_name, video_codec, desired_fps, (width, height)) # type: ignore
+    batch = []
+    while iterating:
+        frame = cv2.resize(frame, (0, 0), fx=0.5, fy=0.5)
+        frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+        if n_frames % SUBSAMPLE == 0:
+            batch.append(frame)
+        if len(batch) == 2 * desired_fps:
+            inputs = image_processor(images=batch, return_tensors="pt").to("cuda")
+            with torch.no_grad():
+                outputs = model(**inputs)
+            boxes = image_processor.post_process_object_detection(
+                outputs,
+                target_sizes=torch.tensor([(height, width)] * len(batch)),
+                threshold=conf_threshold)
+            for i, (array, box) in enumerate(zip(batch, boxes)):
+                pil_image = draw_bounding_boxes(Image.fromarray(array), box, model, conf_threshold)
+                frame = np.array(pil_image)
+                # Convert RGB to BGR
+                frame = frame[:, :, ::-1].copy()
+                output_video.write(frame)
+            batch = []
+            output_video.release()
+            yield output_video_name
+            output_video_name = f"output_{uuid.uuid4()}.mp4"
+            output_video = cv2.VideoWriter(output_video_name, video_codec, desired_fps, (width, height)) # type: ignore
+        iterating, frame = cap.read()
+        n_frames += 1
+    cap.release()
+    output_video.release()
 import gradio as gr
 with gr.Blocks() as app:
         with gr.Column():
             output_video = gr.Video(label="Processed Video", streaming=True, autoplay=True)
+    video.change(
         fn=stream_object_detection,
         inputs=[video, conf_threshold],
         outputs=[output_video],
     )