Compare commits

...

3 Commits

Author | SHA1 | Message | Date
Umair Bin Ahmad | 748a8f010e | Merge 05dbf15213dfd8ba4e0ef8b5ea82ee3821497d6f into 453c6e38a51e9d1d5a2aa5fb7f1014a711913397 | 2025-03-17 19:03:59 +08:00
Wang Ao | 453c6e38a5 | Update README.md | 2025-03-14 10:53:57 +08:00
Umair Bin Ahmad | 05dbf15213 | Create object_tracking_yolov10_rtsp_stream.py | 2024-11-17 21:41:26 +05:00
2 changed files with 82 additions and 1 deletion

README.md

@@ -10,7 +10,7 @@ Please check out our new release on [**YOLOE**](https://github.com/THU-MIG/yoloe
 Comparison of performance, training cost, and inference efficiency between YOLOE (Ours) and YOLO-Worldv2 in terms of open text prompts.
 </p>
-**YOLOE(ye)** is a highly **efficient**, **unified**, and **open** object detection and segmentation model for real-time seeing anything, like human eye, under different prompt mechanisms, like *texts*, *visual inputs*, and *prompt-free paradigm*.
+**YOLOE(ye)** is a highly **efficient**, **unified**, and **open** object detection and segmentation model for real-time seeing anything, like human eye, under different prompt mechanisms, like *texts*, *visual inputs*, and *prompt-free paradigm*, with **zero inference and transferring overhead** compared with closed-set YOLOs.
 <p align="center">
 <img src="https://github.com/THU-MIG/yoloe/blob/main/figures/visualization.svg" width=96%> <br>

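The README text above describes prompting YOLOE with texts, visual inputs, or no prompt at all. As an illustration only (not part of this diff), a minimal text-prompt sketch in the Ultralytics-style API could look like the following; the checkpoint name, class list, and image path are assumptions:

from ultralytics import YOLOE  # assumes an ultralytics build that ships YOLOE

# Load a pretrained YOLOE segmentation checkpoint (file name is an assumption)
model = YOLOE("yoloe-v8l-seg.pt")

# Text prompts: restrict detection/segmentation to these class names
names = ["person", "bus"]
model.set_classes(names, model.get_text_pe(names))

# Run prompted inference on an example image (path is an assumption)
results = model.predict("bus.jpg")
results[0].show()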
object_tracking_yolov10_rtsp_stream.py

@@ -0,0 +1,81 @@
import cv2
import numpy as np
from collections import defaultdict

from ultralytics import YOLO
from ultralytics.utils.plotting import Annotator, colors

# Replace with your RTSP URL
rtsp_url = "rtsp://192.168.100.10/live/1"

# Open a connection to the RTSP stream
cap = cv2.VideoCapture(rtsp_url)

# Tracking history per track ID: a list of box-centre points
track_history = defaultdict(list)

model = YOLO("yolov10s.pt")
names = model.model.names

if not cap.isOpened():
    print("Error: Could not open RTSP stream.")
else:
    print("RTSP stream opened successfully.")

# Read the first frame to confirm the stream delivers frames,
# and grab the stream properties (width, height, FPS)
ret, frame1 = cap.read()
w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
if not ret:
    print("Failed to retrieve frame. Exiting...")
    cap.release()
    cv2.destroyAllWindows()
    exit()

while cap.isOpened():
    success, frame = cap.read()
    if not success:
        print("Failed to retrieve frame. Exiting...")
        break

    # Run YOLOv10 tracking on the frame, keeping IDs persistent across frames
    results = model.track(frame, persist=True, verbose=False)
    boxes = results[0].boxes.xyxy.cpu()

    if results[0].boxes.id is not None:
        # Extract prediction results
        clss = results[0].boxes.cls.cpu().tolist()
        track_ids = results[0].boxes.id.int().cpu().tolist()
        confs = results[0].boxes.conf.float().cpu().tolist()  # extracted for completeness; not used below

        # Annotator init
        annotator = Annotator(frame, line_width=2)

        for box, cls, track_id in zip(boxes, clss, track_ids):
            annotator.box_label(box, color=colors(int(cls), True), label=names[int(cls)])

            # Store tracking history: append the box centre, keep only the last 30 points
            track = track_history[track_id]
            track.append((int((box[0] + box[2]) / 2), int((box[1] + box[3]) / 2)))
            if len(track) > 30:
                track.pop(0)

            # Plot the track: the current centre point plus the trailing polyline
            points = np.array(track, dtype=np.int32).reshape((-1, 1, 2))
            cv2.circle(frame, track[-1], 7, colors(int(cls), True), -1)
            cv2.polylines(frame, [points], isClosed=False, color=colors(int(cls), True), thickness=2)

    # Display the frame
    cv2.imshow("Original Frame", frame)

    # Break the loop on 'q' key press
    if cv2.waitKey(1) & 0xFF == ord('q'):
        print("Exiting...")
        break

# Release resources
cap.release()
cv2.destroyAllWindows()
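The script reads w, h, and fps from the capture but never uses them. As a hedged follow-on (an assumption, not part of this change set), those values could feed a cv2.VideoWriter to persist the annotated stream:

# Hypothetical extension (not part of this PR): save the annotated stream to disk.
# Reuses the w, h, fps values the script already reads; the output file name and
# codec are assumptions.
fps = fps if fps > 0 else 30  # some RTSP sources report 0 for CAP_PROP_FPS
writer = cv2.VideoWriter("tracked_output.avi", cv2.VideoWriter_fourcc(*"MJPG"), fps, (w, h))

# inside the while loop, after annotation:
#     writer.write(frame)

# after the loop, next to cap.release():
#     writer.release()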