Object-Detection-and-Tracking/detect_and_track.py at main · aryansengar007/Object-Detection-and-Tracking · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
import cv2
import numpy as np
import time
from ultralytics import YOLO

def process_video(source, model_variant, conf=0.5, stframe=None, use_deepsort=False,
                  class_filter=None, show_fps=True, show_logs=False):
    """Run YOLO detection on every frame of a video and write an annotated copy.

    Each frame read from ``source`` is passed to the model, matching detections
    are drawn onto the frame (green box plus a ``"<class> <confidence>"``
    label), and the frame is appended to ``output_processed.mp4``.

    Args:
        source: Anything accepted by ``cv2.VideoCapture`` (passed through as-is).
        model_variant: Weights name without extension; ``f"{model_variant}.pt"``
            is handed to ``YOLO``.
        conf: Confidence threshold forwarded to ``model.predict``.
        stframe: Optional object exposing
            ``image(frame, channels=..., use_container_width=...)``; when given,
            every annotated frame is also pushed to it.
            NOTE(review): looks like a Streamlit placeholder -- confirm with caller.
        use_deepsort: Accepted for interface compatibility; not used by this
            function.
        class_filter: Optional collection of class names. When empty or
            ``None`` every detected class is kept.
        show_fps: When true, overlay the measured processing rate on each frame.
        show_logs: When true, append every drawn label to the returned log list.

    Returns:
        A tuple ``(out_path, object_count, logs)`` where ``out_path`` is the
        path of the written video, ``object_count`` maps class name to the
        number of detections summed over all frames (the same object seen in
        N frames counts N times), and ``logs`` is the list of label strings
        (empty unless ``show_logs`` is true).
    """
    model = YOLO(f"{model_variant}.pt")
    cap = cv2.VideoCapture(source)
    out_path = "output_processed.mp4"
    out = None

    object_count = {}
    logs = []

    # try/finally guarantees the capture and writer handles are released even
    # when inference or drawing raises part-way through the video.
    try:
        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        out = cv2.VideoWriter(out_path, cv2.VideoWriter_fourcc(*'mp4v'), 20, (width, height))

        prev_time = time.time()

        while cap.isOpened():
            ret, frame = cap.read()
            if not ret:
                break

            results = model.predict(frame, conf=conf)[0]
            detections = results.boxes.data.cpu().numpy()

            for det in detections:
                # Only the box corners and the class index are integral; the
                # confidence score must stay a float or it truncates to 0.
                x1, y1, x2, y2 = (int(v) for v in det[:4])
                confidence = float(det[4])
                class_name = model.names[int(det[5])]

                if class_filter and class_name not in class_filter:
                    continue

                object_count[class_name] = object_count.get(class_name, 0) + 1
                cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 255, 0), 2)
                label = f"{class_name} {confidence:.2f}"
                cv2.putText(frame, label, (x1, y1 - 10),
                            cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 0), 2)
                if show_logs:
                    logs.append(label)

            if show_fps:
                curr_time = time.time()
                elapsed = curr_time - prev_time
                # Coarse clocks can return identical timestamps for two
                # consecutive frames; avoid dividing by zero in that case.
                fps = 1 / elapsed if elapsed > 0 else 0
                prev_time = curr_time
                cv2.putText(frame, f"FPS: {int(fps)}", (20, 30),
                            cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 255, 255), 2)

            out.write(frame)
            if stframe is not None:
                stframe.image(frame, channels="BGR", use_container_width=True)
    finally:
        cap.release()
        if out is not None:
            out.release()

    return out_path, object_count, logs

def process_image(image, model_variant, use_deepsort=False, class_filter=None, conf=0.5, show_logs=False):
    """Run YOLO detection on a single image and draw the matching detections.

    Boxes and ``"<class> <confidence>"`` labels are drawn directly onto
    ``image`` (the input array is modified in place and also returned).

    Args:
        image: Image passed to ``model.predict`` and to the ``cv2`` drawing
            calls.
        model_variant: Weights name without extension; ``f"{model_variant}.pt"``
            is handed to ``YOLO``.
        use_deepsort: Accepted for interface compatibility; not used by this
            function.
        class_filter: Optional collection of class names. When empty or
            ``None`` every detected class is kept.
        conf: Confidence threshold forwarded to ``model.predict``.
        show_logs: Accepted for interface compatibility; this function does
            not consult it and always fills the returned log list.

    Returns:
        A tuple ``(image, count, object_count, logs)``: the annotated image,
        the total number of kept detections, a mapping of class name to the
        number of kept detections, and the list of label strings drawn.
    """
    model = YOLO(f"{model_variant}.pt")
    results = model.predict(image, conf=conf)[0]
    detections = results.boxes.data.cpu().numpy()
    object_count = {}
    logs = []
    count = 0

    for det in detections:
        # Only the box corners and the class index are integral; the
        # confidence score must stay a float or it truncates to 0.
        x1, y1, x2, y2 = (int(v) for v in det[:4])
        confidence = float(det[4])
        class_name = model.names[int(det[5])]

        if class_filter and class_name not in class_filter:
            continue

        count += 1
        object_count[class_name] = object_count.get(class_name, 0) + 1
        label = f"{class_name} {confidence:.2f}"
        logs.append(label)
        cv2.rectangle(image, (x1, y1), (x2, y2), (255, 0, 0), 2)
        cv2.putText(image, label, (x1, y1 - 10),
                    cv2.FONT_HERSHEY_SIMPLEX, 0.6, (255, 0, 0), 2)

    return image, count, object_count, logs