SamDaLamb committed
Commit 5a89f37 (verified) · Parent: b5b4697

Update app.py

Files changed (1)
  app.py (+143, -59)
app.py CHANGED
@@ -8,73 +8,157 @@ import gradio as gr
Old side (lines 8-80):
  import numpy as np
  import requests
  from PIL import Image
  import torch
  from torchvision import transforms
  from PIL import Image

  # Load the YOLO model
- model_path = "./best-model.torchscript"
  model = torch.jit.load(model_path, map_location=torch.device("cpu"))
  model.eval()

- # Initialize your pose estimation model
- yolo_nas_pose = models.get("best.pt",
-                            num_classes=1,
-                            checkpoint_path="./best.pt")
-
- def process_and_predict(url=None,
-                         image=None,
-                         confidence=0.5,
-                         iou=0.5):
-     # If a URL is provided, use it directly for prediction
-     if url is not None and url.strip() != "":
-         response = requests.get(url)
-         image = Image.open(BytesIO(response.content))
-         image = np.array(image)
-         result = yolo_nas_pose.predict(image, conf=confidence, iou=iou)
-     # If a file is uploaded, read it, convert it to a numpy array and use it for prediction
-     elif image is not None:
-         result = yolo_nas_pose.predict(image, conf=confidence, iou=iou)
-     else:
-         return None  # If no input is provided, return None
-
-     # Extract prediction data
-     image_prediction = result._images_prediction_lst[0]
-
-     pose_data = image_prediction.prediction
-
-     # Visualize the prediction
-     output_image = PoseVisualization.draw_poses(
-         image=image_prediction.image,
-         poses=pose_data.poses,
-         boxes=pose_data.bboxes_xyxy,
-         scores=pose_data.scores,
-         is_crowd=None,
-         edge_links=pose_data.edge_links,
-         edge_colors=pose_data.edge_colors,
-         keypoint_colors=pose_data.keypoint_colors,
-         joint_thickness=2,
-         box_thickness=2,
-         keypoint_radius=5
-     )
-
-     blank_image = np.zeros_like(image_prediction.image)
-
-     skeleton_image = PoseVisualization.draw_poses(
-         image=blank_image,
-         poses=pose_data.poses,
-         boxes=pose_data.bboxes_xyxy,
-         scores=pose_data.scores,
-         is_crowd=None,
-         edge_links=pose_data.edge_links,
-         edge_colors=pose_data.edge_colors,
-         keypoint_colors=pose_data.keypoint_colors,
-         joint_thickness=2,
-         box_thickness=2,
-         keypoint_radius=5
-     )
-
-     return output_image, skeleton_image

  def greet(name):
      return "Hello " + name + "!!"
 
New side (lines 8-164):
  import numpy as np
  import requests
  from PIL import Image
+
+ import gradio as gr
+ import cv2
+ import tempfile
+ import numpy as np
  import torch
  from torchvision import transforms
  from PIL import Image
+ import matplotlib.pyplot as plt
+ from io import BytesIO

  # Load the YOLO model
+ model_path = "./best.pt"
  model = torch.jit.load(model_path, map_location=torch.device("cpu"))
  model.eval()
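Note: the new model_path points at "./best.pt", but the file is still loaded with torch.jit.load, which expects a TorchScript archive rather than a raw checkpoint, so the load only succeeds if best.pt was saved as TorchScript. A minimal sketch of producing such a file, assuming the weights come from an Ultralytics-style training run (an assumption, not stated in this commit):

    # Hypothetical export step -- not part of this commit.
    from ultralytics import YOLO
    YOLO("best.pt").export(format="torchscript")  # writes a .torchscript file next to the weights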

+ transform = transforms.Compose([
+     transforms.Resize((640, 640)),
+     transforms.ToTensor(),
+ ])
+
+ OBJECT_NAMES = ['enemies']
+
+ def detect_objects_in_image(image):
+     img_tensor = transform(image).unsqueeze(0)
+     orig_w, orig_h = image.size
+
+     with torch.no_grad():
+         pred = model(img_tensor)[0]
+
+     if isinstance(pred[0], torch.Tensor):
+         pred = [p.cpu().numpy() for p in pred]
+
+     pred = np.concatenate(pred, axis=0)
+     conf_thres = 0.25
+     mask = pred[:, 4] > conf_thres
+     pred = pred[mask]
+
+     if len(pred) == 0:
+         return Image.fromarray(np.array(image)), None  # Return only image and None for graph
+
+     boxes, scores, class_probs = pred[:, :4], pred[:, 4], pred[:, 5:]
+     class_ids = np.argmax(class_probs, axis=1)
+
+     boxes[:, 0] = boxes[:, 0] - (boxes[:, 2] / 2)
+     boxes[:, 1] = boxes[:, 1] - (boxes[:, 3] / 2)
+     boxes[:, 2] = boxes[:, 0] + boxes[:, 2]
+     boxes[:, 3] = boxes[:, 1] + boxes[:, 3]
+
+     boxes[:, [0, 2]] *= orig_w / 640
+     boxes[:, [1, 3]] *= orig_h / 640
+     boxes = np.clip(boxes, 0, [orig_w, orig_h, orig_w, orig_h])
+
+     indices = cv2.dnn.NMSBoxes(boxes.tolist(), scores.tolist(), conf_thres, 0.5)
+
+     object_counts = {name: 0 for name in OBJECT_NAMES}
+     img_array = np.array(image)
+
+     if len(indices) > 0:
+         for i in indices.flatten():
+             x1, y1, x2, y2 = map(int, boxes[i])
+             cls = class_ids[i]
+             object_name = OBJECT_NAMES[cls] if cls < len(OBJECT_NAMES) else f"Unknown ({cls})"
+             if object_name in object_counts:
+                 object_counts[object_name] += 1
+             cv2.rectangle(img_array, (x1, y1), (x2, y2), (0, 255, 0), 2)
+             cv2.putText(img_array, f"{object_name}: {scores[i]:.2f}", (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
+
+     # Generate and return graph instead of dictionary
+     graph_image = generate_vehicle_count_graph(object_counts)
+
+     return Image.fromarray(img_array), graph_image  # Now returning only 2 outputs
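detect_objects_in_image assumes the TorchScript export returns raw YOLO-style candidates: model(x)[0] laid out as [cx, cy, w, h, confidence, class scores...] at the 640x640 input resolution, which is what the slicing (pred[:, 4], pred[:, 5:]), the xywh-to-xyxy conversion, and the rescaling above rely on. A quick way to confirm that layout for a given export (illustrative only; the blank dummy input is an assumption):

    # Probe the exported model's output shape before trusting the slicing above.
    from PIL import Image
    import torch

    probe = transform(Image.new("RGB", (640, 640))).unsqueeze(0)  # blank dummy frame
    with torch.no_grad():
        out = model(probe)[0]
    print(out.shape if isinstance(out, torch.Tensor) else [o.shape for o in out])
    # expect something like (1, N, 6) for this single-class model: 4 box values + confidence + 1 class score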
+
+
+ # def generate_vehicle_count_graph(object_counts):
+ #     color_palette = ['#4C9ACD', '#88B8A3', '#7F9C9C', '#D1A3B5', '#A1C6EA', '#FFB6C1', '#F0E68C', '#D3B0D8', '#F8A5D1', '#B8B8D1']
+
+ #     fig, ax = plt.subplots(figsize=(8, 5))
+ #     labels = list(object_counts.keys())
+ #     values = list(object_counts.values())
+
+ #     ax.bar(labels, values, color=color_palette[:len(labels)])
+
+ #     ax.set_xlabel("Vehicle Categories", fontsize=12, fontweight='bold')
+ #     ax.set_ylabel("Number of Vehicles", fontsize=12, fontweight='bold')
+ #     ax.set_title("Detected Vehicles in Image", fontsize=14, fontweight='bold')
+
+ #     plt.xticks(rotation=45, ha='right', fontsize=10)
+ #     plt.yticks(fontsize=10)
+
+ #     plt.tight_layout()
+
+ #     buf = BytesIO()
+ #     plt.savefig(buf, format='png')
+ #     buf.seek(0)
+
+ #     return Image.open(buf)
+
+ def generate_vehicle_count_graph(object_counts):
+     color_palette = ['#4C9ACD', '#88B8A3', '#7F9C9C', '#D1A3B5', '#A1C6EA', '#FFB6C1', '#F0E68C', '#D3B0D8', '#F8A5D1', '#B8B8D1']
+
+     fig, ax = plt.subplots(figsize=(8, 5))
+     labels = list(object_counts.keys())
+     values = list(object_counts.values())
+
+     ax.bar(labels, values, color=color_palette[:len(labels)])
+     ax.set_xlabel("Vehicle Categories", fontsize=12, fontweight='bold')
+     ax.set_ylabel("Number of Vehicles", fontsize=12, fontweight='bold')
+     ax.set_title("Detected Vehicles in Image", fontsize=14, fontweight='bold')
+
+     plt.xticks(rotation=45, ha='right', fontsize=10)
+     plt.yticks(fontsize=10)
+     plt.tight_layout()
+
+     buf = BytesIO()
+     plt.savefig(buf, format='png')
+     buf.seek(0)
+
+     plt.close(fig)  # ✅ CLOSE THE FIGURE TO FREE MEMORY
+
+     return Image.open(buf)
+
+ def detect_objects_in_video(video_input):
+     cap = cv2.VideoCapture(video_input)
+     if not cap.isOpened():
+         return "Error: Cannot open video file.", None  # Returning a second value (None) to match expected outputs
+
+     frame_width, frame_height, fps = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)), int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT)), int(cap.get(cv2.CAP_PROP_FPS))
+     temp_video_output = tempfile.NamedTemporaryFile(suffix=".mp4", delete=False).name
+     out = cv2.VideoWriter(temp_video_output, cv2.VideoWriter_fourcc(*'mp4v'), fps, (frame_width, frame_height))
+
+     # Initialize the counts for vehicle categories
+     total_counts = {name: 0 for name in ['car', 'truck', 'bus', 'motorcycle', 'bicycle']}
+
+     while cap.isOpened():
+         ret, frame = cap.read()
+         if not ret:
+             break
+
+         image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
+
+         # Get frame with detected objects and graph
+         frame_with_boxes, graph_image = detect_objects_in_image(image)
+
+         # Convert image back to OpenCV format for writing video
+         out.write(cv2.cvtColor(np.array(frame_with_boxes), cv2.COLOR_RGB2BGR))
+
+     cap.release()
+     out.release()
+
+     return temp_video_output, graph_image  # Return both expected outputs
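Two details of detect_objects_in_video worth flagging: graph_image is assigned only inside the frame loop, so a video with no decodable frames raises UnboundLocalError at the final return, and total_counts is initialized but never updated (its vehicle class names also do not appear in OBJECT_NAMES), so the returned graph reflects only the last processed frame. A small defensive wrapper, sketched as an illustration rather than part of the commit:

    # Hypothetical wrapper so the Gradio outputs always receive two values.
    def detect_objects_in_video_safe(video_input):
        try:
            return detect_objects_in_video(video_input)
        except UnboundLocalError:
            # no frame was decoded, so graph_image was never assigned inside the loop
            return "Error: no readable frames in the video.", None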

  def greet(name):
      return "Hello " + name + "!!"
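
The Gradio wiring that exposes these functions lies outside this hunk; a minimal sketch of how they could be hooked up, with all component names and layout being illustrative assumptions:

    # Illustrative UI wiring only -- the actual interface code lives elsewhere in app.py.
    import gradio as gr

    with gr.Blocks() as demo:
        with gr.Tab("Image"):
            img_in = gr.Image(type="pil")
            img_out = gr.Image(type="pil")
            img_graph = gr.Image(type="pil")
            gr.Button("Detect").click(detect_objects_in_image, inputs=img_in, outputs=[img_out, img_graph])
        with gr.Tab("Video"):
            vid_in = gr.Video()
            vid_out = gr.Video()
            vid_graph = gr.Image(type="pil")
            gr.Button("Detect").click(detect_objects_in_video, inputs=vid_in, outputs=[vid_out, vid_graph])

    demo.launch()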