Upload 5 files

Browse files

FOSS models release 1.0

Files changed (5) hide show

run_sliced_inference.py +141 -0
run_sliced_inference_with_tracker.py +152 -0
unidrone_yolov8m_640px.zip +3 -0
unidrone_yolov8n_448px.zip +3 -0
unidrone_yolov8n_640px.zip +3 -0

run_sliced_inference.py ADDED Viewed

	@@ -0,0 +1,141 @@

+import cv2
+import sys
+import os
+import numpy as np
+from sahi import AutoDetectionModel
+from sahi.predict import get_sliced_prediction, get_prediction
+import supervision as sv
+# Check the number of command-line arguments
+if len(sys.argv) != 8:
+    print("Usage: python yolov8_video_inference.py <model_path> <input_path> <output_path> <slice_height> <slice_width> <overlap_height_ratio> <overlap_width_ratio>")
+    sys.exit(1)
+# Get command-line arguments
+model_path = sys.argv[1]
+input_path = sys.argv[2]
+output_path = sys.argv[3]
+slice_height = int(sys.argv[4])
+slice_width = int(sys.argv[5])
+overlap_height_ratio = float(sys.argv[6])
+overlap_width_ratio = float(sys.argv[7])
+# Load YOLOv8 model with SAHI
+detection_model = AutoDetectionModel.from_pretrained(
+    model_type='yolov8',  # or 'yolov8'
+    model_path=model_path,
+    confidence_threshold=0.1,
+    device="cpu"  # or "cuda"
+)
+# Annotators
+box_annotator = sv.BoxCornerAnnotator(thickness=2)
+label_annotator = sv.LabelAnnotator(text_scale=0.5, text_thickness=2)
+def annotate_image(image, object_predictions):
+    """
+    Given an OpenCV image and a list of object predictions from SAHI,
+    returns an annotated copy of that image.
+    """
+    if not object_predictions:
+        return image.copy()
+    xyxy, confidences, class_ids, class_names = [], [], [], []
+    for pred in object_predictions:
+        bbox = pred.bbox.to_xyxy()  # [x1, y1, x2, y2]
+        xyxy.append(bbox)
+        confidences.append(pred.score.value)
+        class_ids.append(pred.category.id)
+        class_names.append(pred.category.name)
+    xyxy = np.array(xyxy, dtype=np.float32)
+    confidences = np.array(confidences, dtype=np.float32)
+    class_ids = np.array(class_ids, dtype=int)
+    detections = sv.Detections(
+        xyxy=xyxy,
+        confidence=confidences,
+        class_id=class_ids
+    )
+    labels = [f"{cn} {conf:.2f}" for cn, conf in zip(class_names, confidences)]
+    annotated = image.copy()
+    annotated = box_annotator.annotate(scene=annotated, detections=detections)
+    annotated = label_annotator.annotate(scene=annotated, detections=detections, labels=labels)
+    return annotated
+def run_sliced_inference(image):
+    result = get_sliced_prediction(
+        image=image,
+        detection_model=detection_model,
+        slice_height=slice_height,
+        slice_width=slice_width,
+        overlap_height_ratio=overlap_height_ratio,
+        overlap_width_ratio=overlap_width_ratio
+    )
+    return annotate_image(image, result.object_prediction_list)
+def run_full_inference(image):
+    # Normal inference without slicing
+    result = get_prediction(
+        image=image,
+        detection_model=detection_model
+        # postprocess_match_threshold=0.5,  # If you want to adjust the post-processing threshold
+    )
+    return annotate_image(image, result.object_prediction_list)
+# Determine if the input is an image or video based on file extension
+_, ext = os.path.splitext(input_path.lower())
+image_extensions = [".png", ".jpg", ".jpeg", ".bmp"]
+if ext in image_extensions:
+    # ----- IMAGE PROCESSING -----
+    image = cv2.imread(input_path)
+    if image is None:
+        print(f"Error loading image: {input_path}")
+        sys.exit(1)
+    h, w = image.shape[:2]
+    # Decide whether or not to slice
+    if False:  #(h > slice_height) or (w > slice_width):
+        # If the image is bigger than slice dims, do sliced inference
+        annotated_image = run_sliced_inference(image)
+    else:
+        # Otherwise do normal inference
+        annotated_image = run_full_inference(image)
+    cv2.imwrite(output_path, annotated_image)
+    print(f"Inference complete. Annotated image saved at '{output_path}'")
+else:
+    # ----- VIDEO PROCESSING -----
+    cap = cv2.VideoCapture(input_path)
+    if not cap.isOpened():
+        print(f"Error opening video: {input_path}")
+        sys.exit(1)
+    width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+    fps = cap.get(cv2.CAP_PROP_FPS)
+    fourcc = cv2.VideoWriter_fourcc(*"mp4v")
+    out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
+    frame_count = 0
+    while cap.isOpened():
+        ret, frame = cap.read()
+        if not ret:
+            break
+        # For each frame, you may or may not want slicing. Usually, you can do normal slicing if needed.
+        annotated_frame = run_sliced_inference(frame)
+        out.write(annotated_frame)
+        frame_count += 1
+        print(f"Processed frame {frame_count}", end='\r')
+    cap.release()
+    out.release()
+    print(f"\nInference complete. Video saved at '{output_path}'")

run_sliced_inference_with_tracker.py ADDED Viewed

	@@ -0,0 +1,152 @@

+import cv2
+import sys
+from sahi.models.yolov8 import Yolov8DetectionModel
+from sahi.predict import get_sliced_prediction
+import supervision as sv
+import numpy as np
+# Check the number of command-line arguments
+if len(sys.argv) != 8:
+    print("Usage: python yolov8_video_inference.py <model_path> <input_video_path> <output_video_path> <slice_height> <slice_width> <overlap_height_ratio> <overlap_width_ratio>")
+    sys.exit(1)
+# Get command-line arguments
+model_path = sys.argv[1]
+input_video_path = sys.argv[2]
+output_video_path = sys.argv[3]
+slice_height = int(sys.argv[4])
+slice_width = int(sys.argv[5])
+overlap_height_ratio = float(sys.argv[6])
+overlap_width_ratio = float(sys.argv[7])
+# Load YOLOv8 model with SAHI
+detection_model = Yolov8DetectionModel(
+    model_path=model_path,
+    confidence_threshold=0.25,
+    device="cuda"  # or "cpu"
+)
+# Get video info
+video_info = sv.VideoInfo.from_video_path(video_path=input_video_path)
+# Open input video
+cap = cv2.VideoCapture(input_video_path)
+width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+fps = cap.get(cv2.CAP_PROP_FPS)
+fourcc = cv2.VideoWriter_fourcc(*"mp4v")
+# Set up output video writer
+out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))
+# Initialize tracker and smoother
+tracker = sv.ByteTrack(frame_rate=video_info.fps)
+smoother = sv.DetectionsSmoother()
+# Create bounding box and label annotators
+box_annotator = sv.BoxCornerAnnotator(thickness=2)
+label_annotator = sv.LabelAnnotator(
+    text_scale=0.5,
+    text_thickness=1,
+    text_padding=1
+)
+# Process each frame
+frame_count = 0
+class_id_to_name = {}  # Initialize once to store class_id to name mapping
+while cap.isOpened():
+    ret, frame = cap.read()
+    if not ret:
+        break
+    # Perform sliced inference on the current frame using SAHI
+    result = get_sliced_prediction(
+        image=frame,
+        detection_model=detection_model,
+        slice_height=slice_height,
+        slice_width=slice_width,
+        overlap_height_ratio=overlap_height_ratio,
+        overlap_width_ratio=overlap_width_ratio
+    )
+    # Extract data from SAHI result
+    object_predictions = result.object_prediction_list
+    # Initialize lists to hold the data
+    xyxy = []
+    confidences = []
+    class_ids = []
+    # Build or update class_id to name mapping
+    for pred in object_predictions:
+        if pred.category.id not in class_id_to_name:
+            class_id_to_name[pred.category.id] = pred.category.name
+    # Loop over the object predictions and extract data
+    for pred in object_predictions:
+        bbox = pred.bbox.to_xyxy()  # Convert bbox to [x1, y1, x2, y2]
+        xyxy.append(bbox)
+        confidences.append(pred.score.value)
+        class_ids.append(pred.category.id)
+    # Check if there are any detections
+    if xyxy:
+        # Convert lists to numpy arrays
+        xyxy = np.array(xyxy, dtype=np.float32)
+        confidences = np.array(confidences, dtype=np.float32)
+        class_ids = np.array(class_ids, dtype=int)
+        # Create sv.Detections object
+        detections = sv.Detections(
+            xyxy=xyxy,
+            confidence=confidences,
+            class_id=class_ids
+        )
+        # Update tracker with detections
+        detections = tracker.update_with_detections(detections)
+        # Update smoother with detections
+        detections = smoother.update_with_detections(detections)
+        # Prepare labels for label annotator
+        # Include tracker ID in labels if available
+        labels = []
+        for i in range(len(detections.xyxy)):
+            class_id = detections.class_id[i]
+            confidence = detections.confidence[i]
+            class_name = class_id_to_name.get(class_id, 'Unknown')
+            label = f"{class_name} {confidence:.2f}"
+            # Add tracker ID if available
+            if hasattr(detections, 'tracker_id') and detections.tracker_id is not None:
+                tracker_id = detections.tracker_id[i]
+                label = f"ID {tracker_id} {label}"
+            labels.append(label)
+        # Annotate frame with detection results
+        annotated_frame = frame.copy()
+        annotated_frame = box_annotator.annotate(
+            scene=annotated_frame,
+            detections=detections
+        )
+        annotated_frame = label_annotator.annotate(
+            scene=annotated_frame,
+            detections=detections,
+            labels=labels
+        )
+    else:
+        # If no detections, use the original frame
+        annotated_frame = frame.copy()
+    # Write the annotated frame to the output video
+    out.write(annotated_frame)
+    frame_count += 1
+    print(f"Processed frame {frame_count}", end='\r')
+# Release resources
+cap.release()
+out.release()
+print("\nInference complete. Video saved at", output_video_path)

unidrone_yolov8m_640px.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab44f269ec1c57087b30e54aa17aeff6470fa6a6d17d6329b507f396b109d1d2
+size 97694621

unidrone_yolov8n_448px.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1ec33a56bfd4ff1fb4f4f0f90a9852746428b33b4681041c1b1096a13581c54
+size 13055080

unidrone_yolov8n_640px.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b60edd7ede370fdbb89b91aec2ed2f0f0650a86f6cfa8fabb9e32f62a0a7de78
+size 13111623