Multiple object tracking¶
2024-04-07
Per Halvorsen
GitHub
LinkedIn
This note is meant to serve as a compendium of resources for multiple object tracking. It should be read as a work in progress, with the intention of expanding it as more resources arise.
Previous notes on this topic are Exploring the Monterey Bay Benthic Object Detector and Applying Super-resolution to MBARI Benthic Object Detector.
Overview¶
- Background
- Tools for tracking
- Implementation
  - ByteTrack (Roboflow)
Background¶
Object detection¶
Figure 1: Example of object detection of a frame from a dance video (Dataset, Detector)
In object detection, a single frame is considered in isolation, and the goal is to identify and classify particular objects in the frame by drawing bounding boxes around them. This can be done with a focus on a single object or multiple objects, depending on model objective, complexity, and available compute resources. Detections are usually thresholded by a confidence score, and non-maximum suppression is applied to remove overlapping boxes. To achieve state-of-the-art performance on object detection alone, new architectures will likely focus more on prediction correctness than on speed.
Some of the most popular object detection models include YOLO (maintained by Ultralytics) and Faster R-CNN. A state-of-the-art leaderboard for object detection models can be found on the Papers with Code website here. There, you can find the most recent models, along with their whitepapers and code implementations.
Object tracking¶
Figure 2: Example of object tracking in a dance video. (Source: github.com/noahcao/OC_SORT)
Object tracking builds off object detection, but it considers multiple frames in a video sequence. The goal is to associate detections across frames to track the same object over time. In these cases, speed is often more important than initial correctness, as the model must process many frames in a video sequence. The model must consider the object's movement, occlusion, and appearance changes, and update its detections and tracks accordingly.
Typically, it is useful for these models to assign a unique ID to each object in the video sequence. A good tracker will be able to maintain the same ID for an object even when it is occluded or changes appearance. For more rudimentary tracking methods, re-identifying tracked objects occluded by other objects can be a challenge. This may result in the same object receiving new IDs after reappearance, or the object being lost entirely.
Modern trackers exploit deep learning components to include more temporal or visual information about the detections to assist in this process. These more complex trackers can be slower or require more compute resources, introducing a trade-off between speed and correctness. Decisions around this trade-off will depend on the specific use case and available resources.
Tools for tracking¶
With a brief overview of object tracking as a task, we can now explore some techniques in more detail.
Classic¶
Traditional computer vision techniques can be applied to videos as light-weight trackers. Below is a list of some of the most popular classic tracking algorithms, along with brief explanations and links to blog posts explaining them further. These simplified set-ups require two main steps: object segmentation and object association.
Segmentation¶
Background detection¶
While not directly a tracking algorithm, background detection can be used in tandem with other traditional computer vision techniques to make up a light-weight tracker. The general idea is to determine a static background from a set of frames, to differentiate these pixels from moving objects.
A video's background can be determined as the median pixel values over all frames, a process known as temporal median filtering. Such a technique assumes few moving objects and a static background, where moving objects are present in any given pixel in less than 50% of the frames. This method is rudimentary but can be effective in simple tracking tasks, video surveillance, and other applications where the background is relatively static.
More details on background estimation can be found in this blogpost on Simple Background Estimation in Videos using OpenCV.
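As a rough illustration of the idea, the sketch below estimates a background with a temporal median over a handful of sampled frames and flags moving pixels by differencing; the video path and threshold values are placeholders.

```python
import cv2
import numpy as np

# Sketch: temporal median background estimation (video path and values are placeholders)
cap = cv2.VideoCapture("video.mp4")
n_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))

# Sample 25 frames spread evenly across the video
frames = []
for fid in np.linspace(0, n_frames - 1, num=25, dtype=int):
    cap.set(cv2.CAP_PROP_POS_FRAMES, int(fid))
    ok, frame = cap.read()
    if ok:
        frames.append(frame)

# The per-pixel median over time approximates the static background
background = np.median(np.stack(frames), axis=0).astype(np.uint8)
gray_bg = cv2.cvtColor(background, cv2.COLOR_BGR2GRAY)

# Moving objects then show up as large differences from the estimated background
cap.set(cv2.CAP_PROP_POS_FRAMES, 0)
ok, frame = cap.read()
diff = cv2.absdiff(cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY), gray_bg)
_, foreground_mask = cv2.threshold(diff, 30, 255, cv2.THRESH_BINARY)
cap.release()
```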
Contour detection¶
Before the widespread use of neural networks, one way of detecting edges in an image was to use greyscale conversion and binary thresholding. An input image is first converted to greyscale, removing any superfluous color information. Then, a binary threshold is applied to the greyed image, where pixel values above a certain threshold are set to 1 and those below are set to 0. The result is a binary image, where edges are represented by the transition from 0 to 1. From here, a simple contour detection algorithm can be applied to trace the pixels along the edges of objects in the image.
Example of contour detection in OpenCV. (Source: learnopencv.com)
This simple yet useful approach can be applied to videos with both static and dynamic backgrounds. The setup requires minimal computational resources and can therefore be implemented at various stages of a pipeline. In preprocessing steps, contour detection can assist in object detection, telling a model where in a frame it should focus most, increasing detection and segmentation performance. Additionally, contour detection can help in post-detection stages to assist in association and tracking, when combined with IOU or other metrics.
A very simple tracker could be built by using contour detection to segment objects in a frame, labeling each segmented object with an ID. The "detection" step can be run quickly for each frame, recalculating the detections and labels every time. However, in videos where new objects appear or objects disappear, these labels will differ, thus requiring more complex logic around label association between frames. This topic will be explored more thoroughly in the section titled Association.
A detailed walk-through implementing contour detection can be found here.
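To make the idea concrete, here is a minimal sketch of the threshold-then-contour step with OpenCV; the image path, threshold value, and per-frame IDs are placeholders, and the IDs are not yet associated across frames.

```python
import cv2

# Sketch: threshold a frame and trace object contours (path and threshold are placeholders)
frame = cv2.imread("frame.png")
gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)

# Binary threshold: pixels above 127 become 255 (white), the rest become 0 (black)
_, binary = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)

# Trace the boundaries between the 0 and 255 regions
contours, _ = cv2.findContours(binary, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

# Label each contour with a per-frame ID and draw its bounding box
for obj_id, contour in enumerate(contours):
    x, y, w, h = cv2.boundingRect(contour)
    cv2.rectangle(frame, (x, y), (x + w, y + h), (0, 255, 0), 2)
    cv2.putText(frame, f"#{obj_id}", (x, y - 5), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 1)
```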
Mean-shift clustering/segmentation¶
Similar to K-means clustering, mean-shift clustering is a method for finding the modes (or segmentations) of a distribution of data points.
Example of mean-shift clustering in a 2D feature space. (Source: Stanford Vision and Learning Lab)
The algorithm starts by tessellating the feature space with a grid of windows, each centered on a pixel (i.e. odd-numbered height and width window sizes). The algorithm then shifts each window toward the mean of the data points that fall within it, computed in the selected feature space. Eventually, the windows will converge around a single point, which is considered a mode or peak in the data distribution. Windows that converge near the same peak are then merged, and the process is repeated until all windows have converged.
In a simplified 1D set-up (i.e. a greyscale image), the feature space could be the pixel intensity, between 0 and 255. For colored image segmentation, one could instead use the RGB values of an input image. For an even more complex set-up, the feature space could be a combination of pixel color, texture, or other means of describing a subregion of an image.
Similar to contour detection, mean-shift clustering can be used in both pre- and post-processing stages of a pipeline, helping extract the most important features of an input image. A great resource for understanding both mean-shift and k-means clustering (skipped in our note) can be found in this lecture from Stanford Vision and Learning Lab.
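As a quick illustration, OpenCV ships a mean-shift segmentation filter that operates on the joint spatial and color feature space; the image path and window radii in the sketch below are placeholders.

```python
import cv2

# Sketch: mean-shift segmentation of a color image (path and radii are placeholders)
image = cv2.imread("frame.png")

# sp is the spatial window radius and sr the color window radius; pixels are
# iteratively shifted toward the local mode of the joint (x, y, color) feature space
segmented = cv2.pyrMeanShiftFiltering(image, sp=21, sr=51)

cv2.imwrite("frame_segmented.png", segmented)
```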
Association¶
Kalman filter (SORT)¶
While not exactly an association technique by itself, Kalman filters are often used together with association functions like the Hungarian algorithm to update estimations about an object's position. The Kalman filter is a recursive algorithm that estimates the state of a linear dynamic system from a series of noisy measurements. It is used in many fields, including robotics, computer vision, and economics, to predict the future state of a system based on its past states.
The Kalman filter is based on two main assumptions:
- The state of the system can be represented as a linear dynamic system.
- The noise in the system is Gaussian, representable via a mean of 0 and an unknown variance.
By a linear dynamic system, we mean that the state of the system at the next time step can be predicted from the previous state and the system's dynamics (velocity and direction). These dynamics are assumed constant between steps, so the estimated state can be propagated forward from them, similar to a derivative-based physics simulation using $\frac{dx}{dt}$.
The Kalman filtering can be broken down into 3 main stages:
- Estimation: Predict the state of the system at the next time step based on the fixed velocity and (randomly initialized) direction $\rightarrow \hat x_{t+1}$
- Detection: Make a (noisy) measurement of the system $\rightarrow y_{t+1}$
- Update: Update the state estimate with information of the new measurement, giving a more accurate prediction of the system's state $\rightarrow x_{t+1}$
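A minimal numerical sketch of these three stages for a 1D constant-velocity model is shown below; the matrices and measurements are illustrative, not tuned for any real tracker.

```python
import numpy as np

# Sketch: constant-velocity Kalman filter for a 1D position (all values illustrative)
dt = 1.0                                  # time step between frames
F = np.array([[1.0, dt], [0.0, 1.0]])     # state transition: x' = x + v*dt, v' = v
H = np.array([[1.0, 0.0]])                # we only measure position, not velocity
Q = np.eye(2) * 1e-2                      # process noise covariance
R = np.array([[1.0]])                     # measurement noise covariance

x = np.array([[0.0], [1.0]])              # initial state: position 0, velocity 1
P = np.eye(2)                             # initial state covariance

def step(x, P, z):
    # 1. Estimation: predict the next state from the motion model
    x_pred = F @ x
    P_pred = F @ P @ F.T + Q
    # 2. Detection: z is the (noisy) measured position for this frame
    # 3. Update: blend prediction and measurement via the Kalman gain
    y = z - H @ x_pred                    # innovation (measurement residual)
    S = H @ P_pred @ H.T + R              # innovation covariance
    K = P_pred @ H.T @ np.linalg.inv(S)   # Kalman gain
    return x_pred + K @ y, (np.eye(2) - K @ H) @ P_pred

for z in [1.1, 1.9, 3.2, 4.0]:            # fake noisy position measurements
    x, P = step(x, P, np.array([[z]]))
```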
One of the reasons Kalman filters are so useful is because they make use of all the information available to the system. The more information available to a system, the less uncertainty, and thus the more accurate the predictions.
Kalman filters are often used in tracking applications to predict the object's position based on its velocity and update the position based on the detection. The Simple Online Realtime Tracking (SORT) algorithm is a popular tracking algorithm that uses Kalman filtering for predictions and the Hungarian algorithm for association.
A really great resource for understanding Kalman filters is this YouTube video by Visually Explained. A hand-written note covering some of these topics can also be found in this repository here.
Hungarian algorithm (SORT)¶
The Hungarian algorithm is a combinatorial optimization algorithm that solves the assignment problem in polynomial time. It uses a cost matrix to find the optimal assignment of objects across frames, minimizing the total cost of the assignment. The metric used to calculate the cost can be the intersection over union (IOU) between the detections in two frames, the Euclidean distance between the detections, or another metric that captures the similarity between the detections.
Example of the Hungarian algorithm in action on a small example. (Source: Wikipedia)
The steps needed to achieve this systematically are as follows:
- Subtract the smallest element in each row from all elements in that row
- Subtract the smallest element in each column from all elements in that column
- Draw the minimum number of lines needed to cover all zeros in the matrix
- If the number of lines drawn equals the number of rows, the optimal assignment is found
- If not, find the smallest element not covered by a line and subtract it from all uncovered elements, and add it to all elements covered by two lines
- Repeat steps 3-5 until the optimal assignment is found
The Hungarian algorithm is used in SORT to find the optimal assignment of detections across frames. Since the algorithm minimizes total cost, the cost matrix is built from the negative of the IOU between detections in two frames. This way, the assignment it finds is the one that maximizes the IOU between matched detections.
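In practice, one rarely implements the matrix reductions by hand; scipy's linear_sum_assignment solves the same assignment problem. The sketch below builds a negative-IOU cost matrix for a handful of made-up boxes and matches tracks to detections.

```python
import numpy as np
from scipy.optimize import linear_sum_assignment

def iou(box_a, box_b):
    """IOU between two [x1, y1, x2, y2] boxes."""
    x1, y1 = max(box_a[0], box_b[0]), max(box_a[1], box_b[1])
    x2, y2 = min(box_a[2], box_b[2]), min(box_a[3], box_b[3])
    inter = max(0, x2 - x1) * max(0, y2 - y1)
    area_a = (box_a[2] - box_a[0]) * (box_a[3] - box_a[1])
    area_b = (box_b[2] - box_b[0]) * (box_b[3] - box_b[1])
    return inter / (area_a + area_b - inter)

# Hypothetical boxes: existing tracks vs. detections in the new frame
tracks = [[10, 10, 50, 50], [60, 60, 100, 100]]
detections = [[12, 11, 52, 49], [58, 63, 98, 102], [200, 200, 240, 240]]

# Cost matrix is the negative IOU, so minimizing cost maximizes overlap
cost = np.array([[-iou(t, d) for d in detections] for t in tracks])
track_idx, det_idx = linear_sum_assignment(cost)  # e.g. track 0 -> det 0, track 1 -> det 1
```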
Think Autonomous has a great blog post on applying the Hungarian algorithm to object tracking. There you can find an even more detailed breakdown of each of the steps mentioned above, along with clear videos and examples of different cost metrics used in the algorithm.
Mahalanobis Distance¶
The Mahalanobis distance is a measure of the distance between a point and a distribution of other data points, introduced by P. C. Mahalanobis in 1936. It is a multi-dimensional generalization of the idea of measuring how many standard deviations away the point is from the mean of the distribution. This distance is zero if the observed point is at the mean of the distribution (think the center of a circle or centroid of an ellipse), and grows as the point moves away from the mean along each principal component axis.
Example of the Mahalanobis distance in a 2D feature space. (Source: TileStats (YouTube))
The example above comes from a video comparing the Euclidean distance to the Mahalanobis distance in a 2D feature space. In the image, we see that the Euclidean distance between the distribution mean and the two data points is the same, while their Mahalanobis distances differ. The Mahalanobis distance takes into account the covariance of the data, which provides information on the trend of the distribution (diagonal in this case).
In a sense, the Mahalanobis distance mixes the concepts of the mean-shift algorithm mentioned above with information about the covariance of the data. Taking the covariance into account allows the metric to capture correlations in the data, which can be useful in tracking applications where the location of an object changes in both the x and y directions. An object moving along a path is more likely to continue along that path than to suddenly change direction. The Mahalanobis distance can account for this expected path continuation, and thus provide a more accurate measurement of the distance between a detected object and its previous occurrences.
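A small numpy sketch of this on made-up 2D data: two points at the same Euclidean distance from the mean end up with different Mahalanobis distances because of the covariance structure.

```python
import numpy as np

# Sketch: Mahalanobis distance of a point from a 2D point cloud (made-up data)
points = np.random.multivariate_normal(mean=[0, 0], cov=[[3, 2], [2, 3]], size=500)

mu = points.mean(axis=0)
cov_inv = np.linalg.inv(np.cov(points, rowvar=False))

def mahalanobis(x, mu, cov_inv):
    d = x - mu
    return float(np.sqrt(d @ cov_inv @ d))

# Both points are the same Euclidean distance from the mean, but the point lying
# along the correlation trend has a much smaller Mahalanobis distance
print(mahalanobis(np.array([2.0, 2.0]), mu, cov_inv))   # along the trend
print(mahalanobis(np.array([2.0, -2.0]), mu, cov_inv))  # against the trend
```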
In modern object trackers, the Mahalanobis distance sometimes replaces the IOU metric in the association step between the predicted bounding boxes and the detected bounding boxes, as in DeepSORT. For more information on the Mahalanobis distance, check out the video by TileStats mentioned above.
Modern¶
SORT¶
We've already mentioned the Simple Online Realtime Tracking (SORT) algorithm (A. Bewley et al., 2016) a few times now, but we can collect the information here. This is a simple, yet effective, tracking algorithm that uses a Kalman filter for state estimation and the Hungarian algorithm for association. SORT is an online tracking algorithm, meaning it processes frames one at a time and does not require the entire video to be loaded into memory.
For each frame, SORT performs the following steps:
- Detection: Run an object detector on the current frame to get the detections
- Estimation: Make a best estimate of the state of the object in the next frame using a Kalman filter
- Association: Use the Hungarian algorithm to associate the detections across frames
- Create & Delete: Create new tracks for unmatched detections and delete old tracks that have not been matched for a certain number of frames
The methodology section of the original SORT paper actually does a great job at explaining the algorithm in detail, so I would recommend reading that if you want to learn more about SORT. Implementations of SORT can be found in the original repository github.com/abewley/sort. You can also refer to my handwritten note diving into more of the math around SORT and Kalman filtering.
DeepSORT¶
DeepSORT (N. Wojke et al., 2017) is an extension of the SORT algorithm that uses deep learning to improve tracking performance. The main difference between SORT and DeepSORT is that DeepSORT uses a deep neural network to extract embeddings from the detections, which are then used to associate the detections across frames. This allows DeepSORT to associate objects across frames even when they are occluded or change appearance.
Overview of DeepSORT. (Source: A. Parico et al. (2021))
The embeddings are learned representations of the object's appearance that are used to associate objects across frames. They are learned by training a deep neural network on a large dataset of images with labeled objects. For optimal performance, the embeddings should likely be fine-tuned to the domain on which the tracker will be used.
The DeepSORT algorithm can be broken down into the following steps:
- Detection: Run an object detector on the current frame to get the detections, i.e. the bounding boxes and confidence scores for each detected object.
- Feature extraction: For each detected object, use a deep neural network to extract embeddings representing the object's appearance.
- Estimation: Make a best estimate of the state of the object in the next frame using a Kalman filter (similar to in SORT).
- Association: Use the Hungarian algorithm to associate the detections across frames based on the embeddings. Instead of an IOU metric, the values of the cost matrix combine the Mahalanobis distances between object locations and a cosine distance between the appearance embeddings.
- Create & Delete: Create new tracks for unmatched detections and delete old tracks that have not been matched for a certain number of frames
- Re-identification: Re-identify objects that have been occluded or changed appearance by comparing the embeddings of the detections.
The novel steps the DeepSORT algorithm introduces are the feature extraction step, the Mahalanobis distance in the association step, and the re-identification step. The feature extraction and re-id steps introduce deep learning components into the SORT algorithm, which allows DeepSORT to associate objects across frames even when they are occluded or change appearance.
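To illustrate how the motion and appearance terms can be combined into a single association cost, here is a small sketch on made-up numbers; the weighting lam and all values are hypothetical, and this is not DeepSORT's reference implementation.

```python
import numpy as np

# Sketch: blend a motion term (Mahalanobis distance between predicted and detected
# positions) with an appearance term (cosine distance between embeddings); values made up
def cosine_distance(a, b):
    return 1.0 - (a @ b) / (np.linalg.norm(a) * np.linalg.norm(b))

track_pos = np.array([10.0, 20.0])            # Kalman-predicted position of one track
track_cov_inv = np.linalg.inv(np.eye(2) * 4.0)
track_embedding = np.array([0.9, 0.1, 0.4])   # stored appearance embedding of the track

det_pos = np.array([12.0, 19.0])              # a detection in the current frame
det_embedding = np.array([0.85, 0.15, 0.42])  # its appearance embedding

d = det_pos - track_pos
motion_cost = float(np.sqrt(d @ track_cov_inv @ d))                 # Mahalanobis term
appearance_cost = cosine_distance(track_embedding, det_embedding)   # cosine term

lam = 0.5                                     # hypothetical weighting between the two terms
cost = lam * motion_cost + (1 - lam) * appearance_cost
```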
Implementations of DeepSORT can be found in the original repository github.com/nwojke/deep_sort.
ByteTrack¶
ByteTrack (Y. Zhang et al., 2021) is a recent object tracking algorithm that builds off many of the concepts of SORT and DeepSORT, but introduces the use of both high- and low-confidence detections to improve tracking performance. The algorithm is designed to be lightweight for fast and efficient tracking, making it suitable for real-time applications.
The steps of the ByteTrack model can be outlined as follows:
- Detection: Utilizes an object detector like YOLO to predict detection boxes and scores for each frame in a video sequence.
- Confidence Categorization: Separates the detection boxes into high-confidence and low-confidence subsets based on a predefined score threshold.
- Estimation: Applies the Kalman filter to estimate the new locations of tracks in the current frame, capturing the object's motion similar to SORT and DeepSORT.
- High-Confidence Association: Associates high-confidence detection boxes with existing tracks using algorithms like the Hungarian algorithm for initial matching. Here, either the slightly modified IOU metric or the re-identification feature distances (cosine similarities) are used to calculate the cost matrix.
- Low-Confidence Association: Incorporates low-confidence detections with existing tracks, improving the ability to maintain track continuity even with partially occluded objects. Here, only the IOU metric is used to calculate the cost matrix, as the re-id features may be obscured, hence producing a lower confidence around the detection.
- Create & Delete: As before, create new tracks for unmatched high-confidence detections and delete tracks that are no longer visible or have insufficient evidence in the frames.
ByteTrack's differing treatment of high- and low-confidence detections significantly reduces missed detections and fragmented trajectories, which are often caused by occlusions or poor visibility. By combining this confidence handling with the Kalman filter, the tracker improves benchmark tracking performance without sacrificing speed or efficiency.
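The core two-stage idea can be sketched on made-up boxes and scores: high-confidence detections are matched to the tracks first, and leftover tracks then get a second chance against the low-confidence detections using IOU only. This is a simplification of the full BYTE association, with thresholds chosen arbitrarily.

```python
import numpy as np
from scipy.optimize import linear_sum_assignment

def iou(a, b):
    x1, y1 = max(a[0], b[0]), max(a[1], b[1])
    x2, y2 = min(a[2], b[2]), min(a[3], b[3])
    inter = max(0, x2 - x1) * max(0, y2 - y1)
    union = (a[2] - a[0]) * (a[3] - a[1]) + (b[2] - b[0]) * (b[3] - b[1]) - inter
    return inter / union

def match(track_boxes, det_boxes, iou_thresh=0.3):
    """Match tracks to detections by maximizing IOU; return matches and unmatched track indices."""
    if not track_boxes or not det_boxes:
        return [], list(range(len(track_boxes)))
    cost = np.array([[-iou(t, d) for d in det_boxes] for t in track_boxes])
    rows, cols = linear_sum_assignment(cost)
    matches = [(r, c) for r, c in zip(rows, cols) if -cost[r, c] >= iou_thresh]
    matched = {r for r, _ in matches}
    return matches, [i for i in range(len(track_boxes)) if i not in matched]

tracks = [[10, 10, 50, 50], [60, 60, 100, 100]]                    # predicted track boxes
detections = [([12, 11, 52, 49], 0.9), ([61, 62, 99, 101], 0.3)]   # (box, score) pairs

high = [b for b, s in detections if s >= 0.5]   # stage 1: high-confidence detections
low = [b for b, s in detections if s < 0.5]     # stage 2: low-confidence detections

first_matches, leftover = match(tracks, high)
# Second-stage indices refer to the leftover subset of tracks, not the original list
second_matches, still_unmatched = match([tracks[i] for i in leftover], low)
```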
Implementations of ByteTrack can be found in the original repository github.com/ifzhang/ByteTrack and the white paper on arXiv. Roboflow has a great tutorial on how to implement ByteTrack with YOLOv5, which we will use in the next section on implementation.
Implementation¶
ByteTrack (Roboflow)¶
In this section, we will walk through how to implement the ByteTrack algorithm using the YOLOv5 object detector. Here, we can leverage the aforementioned tutorial from Roboflow to guide us through the process. This tutorial makes use of the supervision library to easily load in the ByteTrack tracking algorithm.
Since we do not currently have a lot of local computational resources, we will keep this implementation rather simple. With a working workflow in place, we can later expand on the concepts presented here by distributing the model through Dockerized containers.
Imports¶
We will pip install the required libraries for our simple implementation of ByteTrack. Since we still want to use the Benthic Object Detector from MBARI, we will also need to ensure that the model weights are downloaded locally.
# # if you don't have them already, download supervision and torch
# !pip install supervision torch -q
# !pip install -q moviepy
from moviepy.editor import VideoFileClip
from IPython.display import Image
import numpy as np
import os
import supervision as sv
import torch
MODEL_PATH = "../../models/fathomnet_benthic/mbari-mb-benthic-33k.pt"
# model = torch.hub.load('ultralytics/yolov5', 'custom', path=model_name, force_reload=True)
In order to test our tracker properly, we need to gather some video data where we know the true classifications. Using the screen_capture.py script found in src/tools/, we scraped some short clips of animals from different sources on YouTube, including the Deep Marine Scenes channel credited under the example below. We can use these clips to manually evaluate the performance of the YOLOv5 + ByteTrack pipeline. They get stored locally in the data/ directory.
ByteTrack (default)¶
We can start by running the default ByteTrack model on a video clip of a sea feather, otherwise known as a Crinoidea. The sample clip can be found at data/example/sea_feather.mp4.
class YOLOv5_ByteTracker:
def __init__(self, model_path=MODEL_PATH, **tracker_params):
self.model = torch.hub.load('ultralytics/yolov5', 'custom', path=model_path, force_reload=True)
self.init_tracker(**tracker_params) # create self.tracker and self.suffix attributes
self.box_annotator = sv.BoundingBoxAnnotator()
self.label_annotator = sv.LabelAnnotator()
def init_tracker(self, **tracker_params):
"""Update the tracker parameters."""
# for systematic naming of output files
self.suffix = "_".join([f"{k}{v}" for k, v in tracker_params.items()]) if tracker_params else None
self.tracker = sv.ByteTrack(**tracker_params)
def callback(self, frame: np.ndarray, index: int) -> np.ndarray:
"""Detection callback callled for each frame in the video. Used in process_video later"""
# frame = super_resolution_model(frame) # TODO add when ready
results = self.model(frame) #[0]
detections = sv.Detections.from_yolov5(results)
detections = self.tracker.update_with_detections(detections)
labels = [
f"#{tracker_id} {self.model.model.names[class_id]} {confidence:0.2f}"
for bbox, _, confidence, class_id, tracker_id, _
in detections
]
frame = self.box_annotator.annotate(scene=frame.copy(), detections=detections)
frame = self.label_annotator.annotate(scene=frame.copy(), detections=detections, labels=labels)
return frame
def mot(self, name, data_dir="../data/example", output_dir="../data/results", ext="mp4"):
"""Apply the MOT callback to a video and save the result to a new file."""
output_name = name.split("/")[-1] if "/" in name else name
if self.suffix:
output_name += f"_{self.suffix}"
sv.process_video(
source_path=f"{data_dir}/{name}.{ext}",
target_path=f"{output_dir}/{output_name}_mot.{ext}",
callback=self.callback
)
return f"{output_dir}/{output_name}_mot.{ext}"
def vid2gif(self, video_path, gif_path):
"""Convert a video to a gif."""
clip = VideoFileClip(video_path)
clip.write_gif(gif_path)
return gif_path
def mot_show(self, name, data_dir="../data/example", output_dir="../data/results", ext="mp4"):
"""Wrapper to display the result of the MOT callback as a gif."""
mot_output_path = self.mot(name, data_dir, output_dir, ext)
gif_output_path = self.vid2gif(mot_output_path, mot_output_path.replace(".mp4", ".gif"))
# display the gif
return Image(filename=gif_output_path)
tracker = YOLOv5_ByteTracker(MODEL_PATH)
tracker.mot_show("sea_feather")
Downloading: "https://github.com/ultralytics/yolov5/zipball/master" to /Users/per.morten.halvorsen@schibsted.com/.cache/torch/hub/master.zip YOLOv5 🚀 2024-4-7 Python-3.11.8 torch-2.2.2 CPU Fusing layers... Model summary: 476 layers, 91841704 parameters, 0 gradients Adding AutoShape...
MoviePy - Building file ../data/results/sea_feather_mot.gif with imageio.
<IPython.core.display.Image object>
Crinoidea example footage from the Deep Marine Scenes YouTube channel.
As can be seen in the gif above, our out-of-the-box tracker worked quite well on our example video.
ByteTrack parameters¶
The supervision.ByteTrack class comes with a few tunable parameters. These include:
- track_activation_threshold: the confidence threshold for detections
- lost_track_buffer: the number of frames to keep a track's ID alive when there are no detections for that object
- minimum_matching_threshold: the minimum similarity score (IOU or cosine similarity) for matching detections across frames
- frame_rate: the frame rate of the video
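For reference, these can be passed directly when constructing the tracker, which is roughly what our init_tracker wrapper forwards to supervision; the defaults of 0.25 and 30 are the ones noted below, while the other values are just illustrative.

```python
import supervision as sv

# Roughly what init_tracker passes through; 0.25 and 30 are the defaults noted in
# the text, the remaining values are illustrative
byte_tracker = sv.ByteTrack(
    track_activation_threshold=0.25,  # confidence needed for a detection to activate a track
    lost_track_buffer=30,             # frames to keep a lost track's ID alive
    minimum_matching_threshold=0.8,   # minimum IOU/similarity for matching across frames
    frame_rate=25,                    # frame rate of the input video
)
```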
By adjusting these, we can see how the same model detections can lead to very different tracking results.
Let's see what happens when we start tuning the parameters. To start, let's increase the confidence threshold needed to activate a track (the default value here is 0.25).
tracker.init_tracker(track_activation_threshold=0.4)
tracker.mot_show("sea_feather")
MoviePy - Building file ../data/results/sea_feather_track_activation_threshold0.4_mot.gif with imageio.
<IPython.core.display.Image object>
Notice how the tracker now has a harder time keeping track of the sea feather. At some point, detections are no longer confident enough to be considered worth tracking. Let's find a middle ground between the two thresholds.
tracker.init_tracker(track_activation_threshold=0.29)
tracker.mot_show("sea_feather")
MoviePy - Building file ../data/results/sea_feather_track_activation_threshold0.29_mot.gif with imageio.
<IPython.core.display.Image object>
Notice how there are a few frames now where the tracker loses the sea feather and removes the bounding box, but then quickly recovers it after about 2-3 frames. It's especially interesting here to look at the ID shown in the top-left corner of the bounding box. This is the unique tracked-object ID stored internally in the tracker.
If an object with similar appearance is detected later, and that ID's lost buffer hasn't expired, the tracker will assign the object the same ID as before, as seen above. This re-identification is possible because the lost-track buffer keeps the track's state alive until a sufficiently similar detection reappears.
If the lost buffer expires, however, the tracker will assign a new ID to the object. Let's adjust the lost buffer from its default value of 30 frames down to a single frame to see this new ID assignment in action. We will need to use the same confidence threshold as before, since that was the one that lost the object for a few detections in a row.
tracker.init_tracker(track_activation_threshold=0.29, lost_track_buffer=1)
tracker.mot_show("sea_feather")
MoviePy - Building file ../data/results/sea_feather_track_activation_threshold0.29_lost_track_buffer1_mot.gif with imageio.
<IPython.core.display.Image object>
We now see that the tracker lost the sea feather, which later gets classified as an anemone, specifically a Bolocera. This highlights the importance of the leeway given by the lost buffer, as it allows the tracker to re-identify objects that were occluded or changed appearance.
Another potential problem that can arise here is prolonged misclassification of objects. If the initial detection is incorrect, the tracker may continue to track the object as if it were the misclassified object, even when the object detector has corrected itself.
This potential flaw in our pipeline might be fixed by tuning the minimum matching threshold, which is a threshold (IOU or cosine-similarity score) for matching detections across frames. The documentation states that high values will increase accuracy but may lead to more fragmented tracks, while lower values improve completeness but may lead to more false positives. Initial experimentation suggests the opposite of what is documented (lower values give high fragmentation, while higher values give little to no change). We will reserve looking further into this parameter for future work, where we can test on a wider variety of videos and objects. Though we will not test this parameter here, it is important to keep in mind when tuning the tracker for your specific use case.
Conclusion¶
As can be inferred from the small experiments run above, the parameters of the tracker can be quite fragile.
If the confidence threshold is too high, the tracker may lose objects that are still visible in the video. However, if the confidence is too low, the tracker may wrongly identify an object and stick with that misclassification for the rest of the video.
If the lost buffer is too short, the tracker may assign new IDs to objects that are still visible in the video. Though if the buffer is too long, the tracker risks mistakenly re-identifying a new object as one that was only difficult to predict for a few frames due to pose changes and occlusions.
Feel free to experiment with these parameters on your own, and see how they affect the tracking performance of the ByteTrack algorithm.
Extra resources¶
If you want to use screen_capture.py to scrape clips from the web on your end, you can easily run tracking on resulting videos using the below code:
# i = 0 # change this to the video you want to process
# tracker.mot_show(f"aquarium_{i:03}/aquarium_{i:03}", data_dir="../data/video", output_dir="../data/results", ext="mp4")
Disclaimer¶
We must admit, it took a few tries before getting footage that actually had decent tracking results. The quality of the footage, the frame rate, the number of objects in the frame, and the object's movement all play a role in the tracking performance. This means the example chosen above was a bit cherry-picked to show the best results.
In a real-world scenario, the tracker may not perform as well as shown here, and may require more tuning to get the desired results. However, the main focus here was to get reasonable tracking for an object that is obviously classifiable to the human eye.