Spaces:

tahsinraiyan000
/

neuro-drive-video-model

Sleeping

App Files Community

tahsinraiyan000 committed on May 17

Commit

4544a40

verified ·

1 Parent(s): d50703f

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -38

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ import numpy as np
 from collections import defaultdict
 from transformers import pipeline
-# Initialize the model
 detector = pipeline("object-detection", model="facebook/detr-resnet-101")
 # Global counter
@@ -12,63 +12,34 @@ object_counter = defaultdict(int)
 def process_video(video_path):
     cap = cv2.VideoCapture(video_path)
     while cap.isOpened():
         ret, frame = cap.read()
         if not ret:
             break
-        # Convert frame to RGB
         rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
-        # Detect objects
         results = detector(rgb_frame, threshold=0.7)
-        # Draw boxes and update counter
         for obj in results:
             label = obj["label"]
-            score = obj["score"]
-            box = obj["box"]
             object_counter[label] += 1
             xmin, ymin, xmax, ymax = int(box["xmin"]), int(box["ymin"]), int(box["xmax"]), int(box["ymax"])
             cv2.rectangle(frame, (xmin, ymin), (xmax, ymax), (0, 255, 0), 2)
-            cv2.putText(frame, f"{label} ({score:.2f})", (xmin, ymin-10), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 255, 0), 2)
-        # Display counter
         counter_text = "\n".join([f"{k}: {v}" for k, v in object_counter.items()])
         cv2.putText(frame, counter_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 255), 2)
         yield cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
     cap.release()
-# Gradio UI with Reset Button
 with gr.Blocks() as demo:
-    gr.Markdown("# 🎥 Video Object Detection (DETR-R101)")
-    with gr.Row():
-        video_input = gr.Video(label="Upload Video")
-        video_output = gr.Image(label="Detections")
-    with gr.Row():
-        # Add the reset button here
-        reset_button = gr.Button("Reset Counter", variant="primary")
-    # Process video when uploaded
-    video_input.change(
-        fn=process_video,
-        inputs=video_input,
-        outputs=video_output
-    )
-    # Reset counter when button clicked
-    reset_button.click(
-        fn=lambda: object_counter.clear(),
-        inputs=None,
-        outputs=None,
-        queue=False  # No need to wait in queue
-    )
 demo.launch()

 from collections import defaultdict
 from transformers import pipeline
+# Initialize the model (now works with timm installed)
 detector = pipeline("object-detection", model="facebook/detr-resnet-101")
 # Global counter
 def process_video(video_path):
     cap = cv2.VideoCapture(video_path)
     while cap.isOpened():
         ret, frame = cap.read()
         if not ret:
             break
         rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
         results = detector(rgb_frame, threshold=0.7)
         for obj in results:
             label = obj["label"]
             object_counter[label] += 1
+            box = obj["box"]
             xmin, ymin, xmax, ymax = int(box["xmin"]), int(box["ymin"]), int(box["xmax"]), int(box["ymax"])
             cv2.rectangle(frame, (xmin, ymin), (xmax, ymax), (0, 255, 0), 2)
+            cv2.putText(frame, f"{label}", (xmin, ymin-10), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 255, 0), 2)
         counter_text = "\n".join([f"{k}: {v}" for k, v in object_counter.items()])
         cv2.putText(frame, counter_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 255), 2)
         yield cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
     cap.release()
 with gr.Blocks() as demo:
+    gr.Markdown("# 🎥 Video Object Detection")
+    video_input = gr.Video(label="Upload Video")
+    video_output = gr.Image(label="Detections")
+    reset_button = gr.Button("Reset Counter")
+    video_input.change(process_video, video_input, video_output)
+    reset_button.click(lambda: object_counter.clear())
 demo.launch()