Spaces:
Sleeping
Sleeping
import gradio as gr | |
import torch | |
import cv2 | |
import numpy as np | |
import time | |
from ultralytics import YOLO | |
import spaces | |
import os | |
class CrowdDetection: | |
def __init__(self, model_path="yolov8n.pt"): | |
self.model_path = model_path | |
def crowd_detect(self, video_path): | |
try: | |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu") | |
if not os.path.exists(self.model_path): | |
model = YOLO("yolov8n.pt") | |
model.save(self.model_path) | |
else: | |
model = YOLO(self.model_path) | |
model.to(device) | |
cap = cv2.VideoCapture(video_path) | |
if not cap.isOpened(): | |
raise ValueError(f"❌ Failed to open video: {video_path}") | |
fps = int(cap.get(cv2.CAP_PROP_FPS)) | |
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)) | |
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT)) | |
output_path = "output_crowd.mp4" | |
fourcc = cv2.VideoWriter_fourcc(*"mp4v") | |
out = cv2.VideoWriter(output_path, fourcc, fps, (width, height)) | |
if not out.isOpened(): | |
cap.release() | |
raise ValueError(f"❌ Failed to initialize video writer") | |
CROWD_THRESHOLD = 10 | |
frame_count = 0 | |
while cap.isOpened(): | |
ret, frame = cap.read() | |
if not ret: | |
break | |
frame_count += 1 | |
results = model(frame) | |
person_count = sum(1 for result in results for cls in result.boxes.cls.cpu().numpy() if int(cls) == 0) | |
for result in results: | |
boxes = result.boxes.xyxy.cpu().numpy() | |
classes = result.boxes.cls.cpu().numpy() | |
for box, cls in zip(boxes, classes): | |
if int(cls) == 0: | |
x1, y1, x2, y2 = map(int, box) | |
cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 255, 0), 2) | |
cv2.putText(frame, "Person", (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2) | |
alert_text = "Crowd Alert!" if person_count > CROWD_THRESHOLD else f"People: {person_count}" | |
cv2.putText(frame, alert_text, (50, 50), cv2.FONT_HERSHEY_SIMPLEX, 1, | |
(0, 0, 255) if person_count > CROWD_THRESHOLD else (0, 255, 0), 2) | |
out.write(frame) | |
cap.release() | |
out.release() | |
if frame_count == 0 or not os.path.exists(output_path): | |
raise ValueError("❌ Processing failed: No frames processed or output not created") | |
return output_path | |
except Exception as e: | |
raise ValueError(f"Error in crowd_detection: {str(e)}") | |
class PeopleTracking: | |
def __init__(self, yolo_model_path="yolov8n.pt"): | |
self.model_path = yolo_model_path | |
def people_tracking(self, video_path): | |
try: | |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu") | |
if not os.path.exists(self.model_path): | |
model = YOLO("yolov8n.pt") | |
model.save(self.model_path) | |
else: | |
model = YOLO(self.model_path) | |
model.to(device) | |
cap = cv2.VideoCapture(video_path) | |
if not cap.isOpened(): | |
raise ValueError(f"❌ Failed to open video: {video_path}") | |
fps = int(cap.get(cv2.CAP_PROP_FPS)) | |
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)) | |
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT)) | |
output_path = "output_tracking.mp4" | |
out = cv2.VideoWriter(output_path, cv2.VideoWriter_fourcc(*"mp4v"), fps, (width, height)) | |
if not out.isOpened(): | |
cap.release() | |
raise ValueError(f"❌ Failed to initialize video writer") | |
while cap.isOpened(): | |
ret, frame = cap.read() | |
if not ret: | |
break | |
results = model.track(frame, persist=True) | |
for result in results: | |
boxes = result.boxes.xyxy.cpu().numpy() | |
classes = result.boxes.cls.cpu().numpy() | |
ids = result.boxes.id.cpu().numpy() if result.boxes.id is not None else np.arange(len(boxes)) | |
for box, cls, obj_id in zip(boxes, classes, ids): | |
if int(cls) == 0: | |
x1, y1, x2, y2 = map(int, box) | |
cv2.rectangle(frame, (x1, y1), (x2, y2), (255, 0, 0), 2) | |
cv2.putText(frame, f"ID {int(obj_id)}", (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 0, 0), 2) | |
out.write(frame) | |
cap.release() | |
out.release() | |
if not os.path.exists(output_path): | |
raise ValueError("❌ Processing failed") | |
return output_path | |
except Exception as e: | |
raise ValueError(f"Error in people_tracking: {str(e)}") | |
class FallDetection: | |
def __init__(self, yolo_model_path="yolov8l.pt"): | |
self.model_path = yolo_model_path | |
def fall_detect(self, video_path): | |
try: | |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu") | |
if not os.path.exists(self.model_path): | |
model = YOLO("yolov8l.pt") | |
model.save(self.model_path) | |
else: | |
model = YOLO(self.model_path) | |
model.to(device) | |
cap = cv2.VideoCapture(video_path) | |
if not cap.isOpened(): | |
raise ValueError(f"❌ Failed to open video: {video_path}") | |
fps = int(cap.get(cv2.CAP_PROP_FPS)) | |
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)) | |
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT)) | |
output_path = "output_fall.mp4" | |
out = cv2.VideoWriter(output_path, cv2.VideoWriter_fourcc(*"mp4v"), fps, (width, height)) | |
if not out.isOpened(): | |
cap.release() | |
raise ValueError(f"❌ Failed to initialize video writer") | |
while cap.isOpened(): | |
ret, frame = cap.read() | |
if not ret: | |
break | |
results = model(frame) | |
for result in results: | |
boxes = result.boxes.xyxy.cpu().numpy() | |
classes = result.boxes.cls.cpu().numpy() | |
for box, cls in zip(boxes, classes): | |
if int(cls) == 0: | |
x1, y1, x2, y2 = map(int, box) | |
width = x2 - x1 | |
height = y2 - y1 | |
aspect_ratio = width / height if height > 0 else float('inf') | |
if aspect_ratio > 0.55: | |
color = (0, 0, 255) | |
label = "FALL DETECTED" | |
else: | |
color = (0, 255, 0) | |
label = "Standing" | |
cv2.rectangle(frame, (x1, y1), (x2, y2), color, 2) | |
cv2.putText(frame, label, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2) | |
out.write(frame) | |
cap.release() | |
out.release() | |
if not os.path.exists(output_path): | |
raise ValueError("❌ Processing failed") | |
return output_path | |
except Exception as e: | |
raise ValueError(f"Error in fall_detection: {str(e)}") | |
class FightDetection: | |
def __init__(self, yolo_model_path="yolov8n-pose.pt"): | |
self.model_path = yolo_model_path | |
def fight_detect(self, video_path): | |
try: | |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu") | |
if not os.path.exists(self.model_path): | |
model = YOLO("yolov8n-pose.pt") | |
model.save(self.model_path) | |
else: | |
model = YOLO(self.model_path) | |
model.to(device) | |
cap = cv2.VideoCapture(video_path) | |
if not cap.isOpened(): | |
raise ValueError(f"❌ Failed to open video: {video_path}") | |
fps = int(cap.get(cv2.CAP_PROP_FPS)) | |
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)) | |
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT)) | |
output_path = "output_fight.mp4" | |
out = cv2.VideoWriter(output_path, cv2.VideoWriter_fourcc(*"mp4v"), fps, (width, height)) | |
if not out.isOpened(): | |
cap.release() | |
raise ValueError(f"❌ Failed to initialize video writer") | |
while cap.isOpened(): | |
ret, frame = cap.read() | |
if not ret: | |
break | |
results = model.track(frame, persist=True) | |
fight_detected = False | |
person_count = 0 | |
for result in results: | |
keypoints = result.keypoints.xy.cpu().numpy() if result.keypoints else [] | |
boxes = result.boxes.xyxy.cpu().numpy() if result.boxes else [] | |
classes = result.boxes.cls.cpu().numpy() if result.boxes else [] | |
for box, kp, cls in zip(boxes, keypoints, classes): | |
if int(cls) == 0: | |
person_count += 1 | |
x1, y1, x2, y2 = map(int, box) | |
if len(kp) > 7 and (kp[5][1] < y1 + (y2 - y1) * 0.3 or kp[7][1] < y1 + (y2 - y1) * 0.3): | |
fight_detected = True | |
cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 0, 255) if fight_detected else (0, 255, 0), 2) | |
label = "FIGHT DETECTED" if fight_detected else "Person" | |
cv2.putText(frame, label, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, | |
(0, 0, 255) if fight_detected else (0, 255, 0), 2) | |
if fight_detected and person_count > 1: | |
cv2.putText(frame, "FIGHT ALERT!", (50, 50), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2) | |
out.write(frame) | |
cap.release() | |
out.release() | |
if not os.path.exists(output_path): | |
raise ValueError("❌ Processing failed") | |
return output_path | |
except Exception as e: | |
raise ValueError(f"Error in fight_detection: {str(e)}") | |
class IntrusionDetection: | |
def __init__(self, model_path="yolov8n.pt", max_intrusion_time=300, iou_threshold=0.5, conf_threshold=0.5): | |
self.model_path = model_path | |
self.max_intrusion_time = max_intrusion_time | |
self.iou_threshold = iou_threshold | |
self.conf_threshold = conf_threshold | |
def intrusion_detect(self, video_path): | |
try: | |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu") | |
if not os.path.exists(self.model_path): | |
model = YOLO("yolov8n.pt") | |
model.save(self.model_path) | |
else: | |
model = YOLO(self.model_path) | |
model.to(device) | |
cap = cv2.VideoCapture(video_path) | |
if not cap.isOpened(): | |
raise ValueError(f"❌ Failed to open video: {video_path}") | |
fps = int(cap.get(cv2.CAP_PROP_FPS)) | |
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)) | |
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT)) | |
output_path = "output_intrusion.mp4" | |
fourcc = cv2.VideoWriter_fourcc(*"mp4v") | |
out = cv2.VideoWriter(output_path, fourcc, fps, (width, height)) | |
if not out.isOpened(): | |
cap.release() | |
raise ValueError(f"❌ Failed to initialize video writer") | |
frame_count = 0 | |
while cap.isOpened(): | |
ret, frame = cap.read() | |
if not ret: | |
break | |
frame_count += 1 | |
results = model(frame) | |
for result in results: | |
boxes = result.boxes.xyxy.cpu().numpy() | |
classes = result.boxes.cls.cpu().numpy() | |
confidences = result.boxes.conf.cpu().numpy() | |
for box, cls, conf in zip(boxes, classes, confidences): | |
if int(cls) == 0 and conf > self.conf_threshold: # Person class with confidence filter | |
x1, y1, x2, y2 = map(int, box) | |
label = "Intruder" | |
color = (0, 0, 255) | |
cv2.rectangle(frame, (x1, y1), (x2, y2), color, 2) | |
cv2.putText(frame, label, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2) | |
out.write(frame) | |
cap.release() | |
out.release() | |
if frame_count == 0 or not os.path.exists(output_path): | |
raise ValueError("❌ Processing failed: No frames processed or output not created") | |
return output_path | |
except Exception as e: | |
raise ValueError(f"Error in detect_intrusion: {str(e)}") | |
import cv2 | |
import numpy as np | |
from ultralytics import YOLO | |
from shapely.geometry import Point, Polygon | |
import time | |
class LoiteringDetector: | |
def __init__(self, model_path='loitering_model.pt'): | |
self.model = YOLO(model_path) | |
def loitering_detect(self, video_path, area): | |
# Create polygon zone | |
time_threshold = 7 | |
detection_threshold = 0.6 | |
zone_points = None | |
if area == '131': | |
zone_points = [(842//1.5, 514//1.7), (686//1.5, 290//1.7), (775//1.5, 279//1.7), (961//1.5, 488//1.7)] | |
elif area == '145': | |
zone_points = [(153, 850), (139, 535), (239, 497), (291, 857)] | |
zone = Polygon(zone_points) | |
# Open video | |
cap = cv2.VideoCapture(video_path) | |
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH) * 0.5) | |
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT) * 0.5) | |
fps = int(cap.get(cv2.CAP_PROP_FPS)) | |
# Create video writer | |
output_path = os.path.join(tempfile.gettempdir(), "loitering_video.mp4") | |
fourcc = cv2.VideoWriter_fourcc(*'mp4v') | |
out = cv2.VideoWriter(output_path, fourcc, fps, (width, height)) | |
while cap.isOpened(): | |
ret, frame = cap.read() | |
if not ret: | |
break | |
frame = cv2.resize(frame, (width, height)) | |
# Perform object detection and tracking | |
results = self.model.track(frame, persist=True, classes=[0], conf=detection_threshold) # 0 is the class ID for person | |
# List to store time information for display | |
time_display = [] | |
if results[0].boxes.id is not None: | |
boxes = results[0].boxes.xyxy.cpu().numpy().astype(int) | |
ids = results[0].boxes.id.cpu().numpy().astype(int) | |
for box, id in zip(boxes, ids): | |
x1, y1, x2, y2 = box | |
center = Point((x1 + x2) / 2, (y1 + y2) / 2) | |
if id not in person_info: | |
person_info[id] = {'in_zone': False, 'start_time': None, 'duration': 0} | |
if zone.contains(center): | |
if not person_info[id]['in_zone']: | |
person_info[id]['in_zone'] = True | |
person_info[id]['start_time'] = time.time() | |
person_info[id]['duration'] = time.time() - person_info[id]['start_time'] | |
if person_info[id]['duration'] > time_threshold: | |
color = (0, 0, 255) # Red for loitering | |
else: | |
color = (0, 255, 0) # Green for in zone | |
time_display.append(f"ID: {id}, Time: {person_info[id]['duration']:.2f}s") | |
else: | |
person_info[id]['in_zone'] = False | |
person_info[id]['start_time'] = None | |
person_info[id]['duration'] = 0 | |
color = (255, 0, 0) # Blue for outside zone | |
cv2.rectangle(frame, (x1, y1), (x2, y2), color, 2) | |
cv2.putText(frame, f"ID: {id}", (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2) | |
# Draw polygon zone | |
cv2.polylines(frame, [np.array(zone_points, np.int32)], True, (255, 255, 0), 2) | |
# Display time information in top left | |
for i, text in enumerate(time_display): | |
cv2.putText(frame, text, (10, 30 + i * 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (255, 255, 255), 2) | |
out.write(frame) | |
cap.release() | |
out.release() | |
return output_path | |
def process_video(feature, video, area=None): | |
detectors = { | |
"Crowd Detection": CrowdDetection, | |
"People Tracking": PeopleTracking, | |
"Fall Detection": FallDetection, | |
"Fight Detection": FightDetection, | |
"Intrusion Detection": IntrusionDetection, | |
"Loitering Detection": LoiteringDetection | |
} | |
try: | |
detector = detectors[feature]() | |
method_name = feature.lower().replace(" ", "_").replace("detection", "detect") # Ensures correct method name | |
if feature == "Loitering Detection": | |
output_path = detector.detect_loitering(video, area) # Pass area if required | |
else: | |
output_path = getattr(detector, method_name)(video) | |
return f"{feature} completed successfully", output_path | |
except Exception as e: | |
return f"Error: {str(e)}", None | |
# Gradio Interface with additional input for Loitering Detection | |
interface = gr.Interface( | |
fn=process_video, | |
inputs=[ | |
gr.Dropdown(choices=[ | |
"Crowd Detection", "People Tracking", "Fall Detection", | |
"Fight Detection", "Intrusion Detection", "Loitering Detection" | |
], label="Select Feature"), | |
gr.Video(label="Upload Video"), | |
gr.Textbox(label="Loitering Area (131 or 145)") # Can be replaced with a drawing tool | |
], | |
outputs=[ | |
gr.Textbox(label="Status"), | |
gr.Video(label="Processed Video") | |
], | |
title="YOLOv8 Multitask Video Processing", | |
description="Select a feature to process your video: Crowd Detection, People Tracking, Fall Detection, or Fight Detection." | |
) | |
if __name__ == "__main__": | |
interface.launch(debug=True) | |