Super-resolution Benthic Object Detection¶
2024-03-11
Per Halvorsen
GitHub
LinkedIn
In our last notebook, we evaluated MBARI's Monterey Bay Benthic Object Detector on the external TrashCAN dataset. There, we found that model results were good, given the slight adaptations we made to compare against the new annotations. However, we also saw potential for increased model performance when applying some types of upscaling to the input images.
In this note, we will build a workflow to easily feed the inputs from the TrashCAN dataset through a super-resolution (SR) layer before feeding them into the MBARI model. We then evaluate the performance of the model with and without the SR layer to see how much improvement, if any, we can achieve. It will also be important to measure computation time and memory usage, as some of the SR models we test are quite complex.
Before diving into the code, we will first discuss our motivations for applying a super-resolution layer to the input images, along with some fundamentally different architectures useful for SR. Specifically, we will look at GANs, Transformers, and the more traditional CNN-based SR models.
In later notes, we can explore fine-tuning the setup built here. This is important to keep in mind when making decisions about our implementations of the super-resolution modules.
Setup¶
In this section we set up the development environment, for readers who want to reproduce the results in this note. If you are just interested in reading about the experiment, jump to the next section.
Install dependencies¶
Uncomment the following line if you haven't already installed this repo's requirements.
# %pip install -r ../requirements.txt
Temporary note¶
The basicsr
library has a small bug that breaks imports. Luckily, there is a quick fix for this found here, thanks to Th3Rom3.
The fix is to change line 8 in basicsr/data/degradations.py
file from:
from torchvision.transforms.functional_tensor import rgb_to_grayscale
to:
# from torchvision.transforms.functional_tensor import rgb_to_grayscale
from torchvision.transforms.functional import rgb_to_grayscale
This is easily done by drilling into the module in the import below, by holding down ctrl
(Windows) or command
(Mac) and clicking on the import. If you are using a Linux system, you probably know how to update this on your own machine.
Then, we can change the line and save the file.
# import basicsr.data.degradations
Imports¶
# %load_ext autoreload
# %autoreload 2
from fathomnet.models.yolov5 import YOLOv5Model
from IPython.display import display
from pathlib import Path
from PIL import Image
from PIL import ImageOps
from pycocotools.coco import COCO
from torch.profiler import profile, record_function, ProfilerActivity
from typing import List, Union
import cv2
import json
import numpy as np
import onnxruntime
import os
import torch
# ABPN imports
from tqdm.auto import tqdm
# ESRGAN imports
from basicsr.archs.rrdbnet_arch import RRDBNet
from realesrgan import RealESRGANer
Paths¶
root_dir = Path(os.getcwd().split("personal/")[0])
repo_dir = root_dir / "personal" / "ocean-species-identification"
data_dir = root_dir / "data" / "TrashCAN"
models_dir = root_dir / "personal" / "models"
HAT model imports¶
We need to load the HAT architecture from the repo itself. To do this, we need to have the repo locally and install it through pip. We baked this into a script scripts/get_hat.sh
.
!source $repo_dir/scripts/get_hat.sh $repo_dir
from hat.archs.hat_arch import HAT
Reuse code from previous notebook¶
# reuse some code from the previous notebook, ported to src.data
os.chdir(repo_dir)
from src.data import images_per_category
from src.evaluation import evaluate_model
Load¶
We will start by loading the TrashCAN dataset, the MBARI model, and the label map between the two. Aside from path building, each requires only a single line of code to load.
benthic_model_weights_path = models_dir / "fathomnet_benthic" / "mbari-mb-benthic-33k.pt"
benthic_model = YOLOv5Model(benthic_model_weights_path)
trashcan_data = COCO(data_dir / "dataset" / "material_version" / "instances_val_trashcan.json")
benthic2trashcan_ids = json.load(open(repo_dir / "data" / "benthic2trashcan_ids.json"))
Using cache found in /Users/per.morten.halvorsen@schibsted.com/.cache/torch/hub/ultralytics_yolov5_master YOLOv5 🚀 2024-3-16 Python-3.11.5 torch-2.2.1 CPU Fusing layers... Model summary: 476 layers, 91841704 parameters, 0 gradients Adding AutoShape...
loading annotations into memory... Done (t=0.04s) creating index... index created!
# benthic_model._model.eval()
Super resolution model¶
In our first notebook, we mentioned a super-resolution model that could possibly help the Benthic Object Detector perform better on our held-out dataset. The architecture used there was a PyTorch implementation of the Anchor-based Plain Net for Mobile Image Super-Resolution model, which is a light-weight CNN-based architecture. In this section, we will explore this and other types of super-resolution models, including the Enhanced Super-Resolution GAN and the Hybrid Attention Transformer, to see if they can help improve model performance.
Background¶
Motivation¶
The general idea with this setup is that if we can enhance some of the low-level, fine-grained patterns in the images, the larger picture may be easier to interpret for the model.
The Benthic Object Detector is trained from a YOLOv5 backbone. This architecture contains a deep stack of convolutional layers, making it good at picking up low-level features, such as edges and textures, in its first few layers. The deeper CNN layers are then able to piece these features together to produce high-level predictions about the full objects in the image, as done in object detection. A super-resolution preprocessing step would then aim to enhance the low-level features, making them clearer for the Benthic model to work its math-magical calculations on.
Convolutions¶
Briefly explained, convolutional layers apply a filter to a sliding window of the input pixels, before pooling, allowing the strongest signal from each "glimpse" to pass through. The more filters a model has, the more flexibility it has to "focus" on different patterns or features in the inputs. This is essential for upscaling, since the model will need to learn to correctly predict the values of the new pixels it adds to the image.
Inputs are often split into a number of channels, which can be thought of as "slices" of the input image, like RGB layers. A convolutional filter will then also have the same number of channels, with tunable parameters for each one.
In the animation below, we can see eight 3x3 convolutional filters applied to a 7x6 input already split into 8 channels.
Check out this great visualization of convolutions from Animated AI on Youtube
The results of the matrix multiplication between the filter and the input are then pooled to produce a single value in the output. This means output sizes vary greatly depending on the size of the input, filter, stride, and dilation. As you can see, the more filters you have, the more layers of features you get in your outputs.
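As a quick, hypothetical sketch of this shape bookkeeping (assuming stride 1, no padding, and no dilation; the layer and tensor here are illustrative, not part of our pipeline), we can check how a 3x3 convolution shrinks a small input in PyTorch:

import torch
import torch.nn as nn

# 8 input channels and 8 filters (output channels), mirroring the animation above
conv = nn.Conv2d(in_channels=8, out_channels=8, kernel_size=3)

x = torch.randn(1, 8, 6, 7)  # batch, channels, height, width
print(conv(x).shape)  # torch.Size([1, 8, 4, 5]): each spatial dim shrinks by kernel_size - 1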
Super-resolution models¶
We previously made use of the Anchor-based Plain Net model as our initial upsampler due to its light-weight architecture and ease of use. Other, more complex models exist that are trained for SISR, or single-image super-resolution. These don't consider computational cost as much, and instead focus on performance. In this note, we consider a few hand-picked models to measure any performance differences between architectures and complexity levels.
Model size is only one of many factors to take into account when choosing a computer vision model.
There are also a few different base components to consider, each with their own strengths and empirical relevance.
Some emphasize full-image context, others emphasize local features and flexibility.
The base architectural components we briefly look into here are: GANs, CNNs, and Attention.
The papers for the following architectures can be found in the research/
folder.
ABPN: Anchor-based Plain Net for Mobile Image Super-Resolution
This is the model we used in our first notebook, via this playground. As an INT8-quantized model, the SR Mobile PyTorch model aims to be as small, yet efficient, as possible, in order to run on mobile devices. It can "restore twenty-seven 1080P images (x3 scale) per second, maintaining good perceptual quality as well." In other words, it is fast and computationally cheap.
The ABPN architecture makes use of convolutions, residual connections, and a pixel shuffle layer.
A residual connection is a way to "skip" a layer in a neural network, sending an untouched version of the input to a later layer to preserve the original signal. In super-resolution, this helps the model maintain important features of the input when upscaling the image. Various architectures make use of residual connections rather differently, sometimes in very complex manners. The ABPN model, however, uses a simple residual connection, as seen in the image below.
Notice one of the last layers called "depth to space". This is a pixel shuffle layer, which is a way to upscale the input by rearranging the pixels in the input. This component leverages the features extracted by the upstream CNN layers to predict the values of the final pixels in the output image. Animated AI has another great visualization to explain this concept.
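To tie these two components together, here is a minimal, hypothetical sketch (not the actual ABPN code) of a single residual connection feeding a pixel shuffle ("depth to space") upscaling tail:

import torch
import torch.nn as nn

class TinyUpscaler(nn.Module):
    def __init__(self, channels: int = 32, scale: int = 4):
        super().__init__()
        self.body = nn.Conv2d(channels, channels, kernel_size=3, padding=1)
        # produce scale^2 feature maps per output channel for the pixel shuffle
        self.to_pixels = nn.Conv2d(channels, 3 * scale**2, kernel_size=3, padding=1)
        self.shuffle = nn.PixelShuffle(scale)

    def forward(self, x):
        x = x + self.body(x)  # residual: the untouched input is added back
        return self.shuffle(self.to_pixels(x))  # (3*s^2, H, W) -> (3, s*H, s*W)

print(TinyUpscaler()(torch.randn(1, 32, 64, 64)).shape)  # torch.Size([1, 3, 256, 256])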
The model we will use here is a PyTorch adaptation of the original model, which was written in TensorFlow. According to the SR Mobile PyTorch GitHub, the architecture was ported as-is, with minimal changes. We opted for the PyTorch version of this architecture since it was easier to use out of the box, and because PyTorch is subjectively easier to work with.
ESRGAN: Enhanced Super-Resolution Generative Adversarial Networks
Published as a state-of-the-art super resolution model in 2018, the ESRGAN is much more complex than the previous model.
It was trained using a generator-discriminator setup, similar to SRGAN, with a perceptual loss computed from the features of a 19-layer VGG network.
Including this model in our evaluation will allow us to observe the difference larger models can make in performance.
Below, we see an outline of the SRGAN architecture, the parent model of ESRGAN.
Two major changes from the SRGAN model were made to the generator in ESRGAN:
1. They removed batch normalization inside the dense blocks.
Batch normalization is a technique used to normalize the outputs of an upstream component based on the other examples in the batch, which can improve generalization and avoid overfitting.
The paper's reasoning behind removing this layer was that batch normalization can introduce artifacts during evaluation, since the model normalizes with a mean and variance estimated during training. This becomes a problem in datasets where the training and test sets can vary quite a lot.
Additionally, empirical observations have shown that removing batch-normalization increases generalization and performance, while lowering computational cost.
2. They introduced Residual-in-Residual Dense Block (RRDB).
Connecting all layers through residual connectors is expected to boost performance, as it allows the model to learn more complex features.
This is the opposite extreme of the ABPN model, which uses a single residual connection.
There has been other work on multilevel residual networks (Zhang et al. 2017) showing great performance improvements in a range of computer vision tasks. It is, however, important to keep in mind that this added complexity will also increase the required compute resources. If we were to fit our pipeline into the head of an underwater ROV, we would really need to balance the tradeoff between performance and computational cost. A minimal sketch of the residual-in-residual idea follows below.
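To make the residual-in-residual idea concrete, here is a minimal, hypothetical sketch; it is much smaller than the actual RRDB and omits the dense connectivity, but shows an outer skip connection wrapped around a stack of inner residual blocks:

import torch
import torch.nn as nn

class InnerResidualBlock(nn.Module):
    # simplified stand-in for one dense block (no batch normalization)
    def __init__(self, channels: int = 64):
        super().__init__()
        self.conv = nn.Conv2d(channels, channels, kernel_size=3, padding=1)

    def forward(self, x):
        return x + self.conv(x)  # inner skip: input added back to the conv output

class RRDBSketch(nn.Module):
    # residual-in-residual: an outer skip wraps a stack of inner residual blocks
    def __init__(self, channels: int = 64, beta: float = 0.2):
        super().__init__()
        self.blocks = nn.Sequential(*[InnerResidualBlock(channels) for _ in range(3)])
        self.beta = beta  # residual scaling factor, as used in the ESRGAN paper

    def forward(self, x):
        return x + self.beta * self.blocks(x)  # outer skip around the whole stack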
Some other key improvements of the ESRGAN over previous architectures include:
- Relativistic discriminator: predicts a probability of an image being real or not, rather than a binary decision.
- Refined perceptual loss: constraining (applying) the loss on features before the activation functions, to preserve more information.
- Network interpolation: blending the weights of two models, the fine-tuned GAN and a peak signal-to-noise ratio (PSNR) oriented model, with a weighting factor. This makes it easy to balance output quality without having to retrain the model (a small sketch of this follows below).
(I am not sure if they removed the batch normalization from the discriminator as well, but this can be looked into in their implementation on GitHub.)
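To illustrate network interpolation, here is a hypothetical sketch (not the Real-ESRGAN code; the file names are placeholders) that blends two state dicts with a weighting factor alpha:

import torch

def interpolate_networks(state_gan, state_psnr, alpha=0.5):
    # blend the GAN-trained and PSNR-oriented weights key by key;
    # alpha=1.0 recovers the GAN model, alpha=0.0 the PSNR model
    return {key: alpha * state_gan[key] + (1 - alpha) * state_psnr[key] for key in state_gan}

# hypothetical usage:
# blended = interpolate_networks(torch.load("gan.pth"), torch.load("psnr.pth"), alpha=0.8)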
HAT: Hybrid Attention Transformer for Image Restoration
Recently, Transformer models have shown huge performance boosts in computer vision tasks, after their great success in NLP.
The Hybrid Attention Transformer is a hybrid model that combines both attention and convolutions.
It was published in late 2023, and currently holds the state-of-the-art title for most of the classic super-resolution benchmark datasets.
It builds off of other attention-based SR models such as the Swin Transformer and RCAN.
A transformer is a component of neural networks that uses cross- or self-attention.
Attention is a matrix multiplication that adds contextual information to each token or pixel, through the use of queries, keys, and values.
The image below shows what this looks like in the context of language processing.
By Peltarion on YouTube
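As a bare-bones, hypothetical sketch of self-attention (single head, with random weight matrices standing in for the learned projections):

import torch
import torch.nn.functional as F

def self_attention(x, w_q, w_k, w_v):
    # x: (tokens, dim); queries, keys, and values are projections of the input
    q, k, v = x @ w_q, x @ w_k, x @ w_v
    scores = q @ k.T / k.shape[-1] ** 0.5  # scaled pairwise similarity between tokens
    return F.softmax(scores, dim=-1) @ v  # context-weighted mix of the values

tokens = torch.randn(5, 16)  # 5 tokens (or pixels), each a 16-dim embedding
w_q, w_k, w_v = (torch.randn(16, 16) for _ in range(3))
print(self_attention(tokens, w_q, w_k, w_v).shape)  # torch.Size([5, 16])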
Building off the SwinIR model, the HAT model uses residual-in-residual connections to propagate information through the network.
Residual-in-residual connections are some of the most complex skip connections, since they preserve the original signal at every small step along the way, as well as at the end of the block.
As can be expected, this slows down data flow, but can also greatly improve performance.
The main components of HAT can be broken into three main parts:
- Shallow feature extraction: a few layers of convolutions that extract low-level features from the input.
- Deep feature extraction: a few layers of transformer blocks that extract high-level features from the latent, low-level features.
- Image reconstruction: a few layers of convolutions aimed to upsample the latent features to the scale of the final output.
In the image below, we see some of the main components of the HAT model, starting with a rough overview of the pipeline (a & b), followed by more fine-grained details of each of the blocks (c-f).
Borrowed directly from the white paper.
I'll save the details for the paper, but some of the key points are:
- Each residual hybrid attention group (RHAG) contains a cross-attention block, a self-attention block, and a channel attention block (see the channel-attention sketch after this list).
- RHAGs also utilize a convolution as their final sub-layer, to help the transformer "get a better visual representation" of the input.
- Pixel shuffling is used in the upscale module, similar to the ABPN model.
- They introduce overlapping cross attention, meaning the windows of the attention blocks overlap. This differs from the original image transformer models, which used non-overlapping, same-sized windows for the queries, keys, and values.
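To make the channel attention component concrete, here is a minimal, squeeze-and-excitation-style sketch; this is a hypothetical simplification, not HAT's exact channel attention block:

import torch
import torch.nn as nn

class ChannelAttentionSketch(nn.Module):
    def __init__(self, channels: int = 64, squeeze: int = 16):
        super().__init__()
        self.pool = nn.AdaptiveAvgPool2d(1)  # global spatial average per channel
        self.fc = nn.Sequential(
            nn.Conv2d(channels, channels // squeeze, kernel_size=1),
            nn.ReLU(inplace=True),
            nn.Conv2d(channels // squeeze, channels, kernel_size=1),
            nn.Sigmoid(),  # per-channel weights in [0, 1]
        )

    def forward(self, x):
        return x * self.fc(self.pool(x))  # reweight each channel by its importance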
The HAT model is yet another deep and complex model, with a large number of layers and parameters. This model is expected to perform well, but will also be quite slow at both inference and fine-tuning.
Our selection of models is not exhaustive, but it does cover a range of important topics within the field of computer vision and neural networks. Let's move on to the next stage, where we will implement the models and evaluate their performance.
Implementation¶
Now that we have a basic understanding of the few models we will look into, we are ready to load them into our environment and feed them our TrashCAN data.
Steps¶
For each model, we will execute the following steps:
- (single) feed image from COCO through SR models
- (single) feed outputs through MBARI model & show detections
- (full) wrap dataflow into a pipeline
- (full) run classification on a given category of TrashCAN images
Super resolution on a single image¶
To load in images for a particular category, we can reuse some logic from the previous notebooks ported to src.data.images_per_category
.
# get only starfish images using src.data.images_per_category
starfish_images = images_per_category("animal_starfish", trashcan_data, data_dir / "dataset" / "material_version" / "val")
example_image_path = starfish_images[3]
example_image = Image.open(example_image_path)
print(np.array(example_image).shape)
display(example_image)
(270, 480, 3)
ABPN¶
# abpn_model_path = models_dir / "sr_mobile_python" / "models_modelx2.ort"
abpn_model_path = models_dir / "sr_mobile_python" / "models_modelx4.ort"
The following methods were adapted from the sr_mobile_python
's inference
module.
class ABPN(torch.nn.Module):
def __init__(self, model_path: str, store: bool = True):
super().__init__()  # required when subclassing torch.nn.Module
self.model_path = model_path
self.saved_imgs = {}
self.store = store
def pre_process(self, img: np.array) -> np.array:
# H, W, C -> C, H, W
img = np.transpose(img[:, :, 0:3], (2, 0, 1))
# C, H, W -> 1, C, H, W
img = np.expand_dims(img, axis=0).astype(np.float32)
return img
def post_process(self, img: np.array) -> np.array:
# 1, C, H, W -> C, H, W
img = np.squeeze(img)
# C, H, W -> H, W, C
img = np.transpose(img, (1, 2, 0))
return img
def save(self, img: np.array, save_name: str) -> None:
# cv2.imwrite(save_name, img)
if self.store:
self.saved_imgs[save_name] = img
def inference(self, img_array: np.array) -> np.array:
# unsure about the ability to train an ONNX model from a Mac
ort_session = onnxruntime.InferenceSession(self.model_path)
ort_inputs = {ort_session.get_inputs()[0].name: img_array}
ort_outs = ort_session.run(None, ort_inputs)
return ort_outs[0]
def upsample(self, image_paths: List[str]):
outputs = []
for image_path in tqdm(image_paths):
img = cv2.imread(image_path, cv2.IMREAD_UNCHANGED)
# filename = os.path.basename(image_path)
if img.ndim == 2:
img = cv2.cvtColor(img, cv2.COLOR_GRAY2BGR)
if img.shape[2] == 4:
alpha = img[:, :, 3] # GRAY
alpha = cv2.cvtColor(alpha, cv2.COLOR_GRAY2BGR) # BGR
alpha_output = self.post_process(
self.inference(self.pre_process(alpha))
) # BGR
alpha_output = cv2.cvtColor(alpha_output, cv2.COLOR_BGR2GRAY) # GRAY
img = img[:, :, 0:3] # BGR
image_output = self.post_process(
self.inference(self.pre_process(img))
) # BGR
output_img = cv2.cvtColor(image_output, cv2.COLOR_BGR2BGRA) # BGRA
output_img[:, :, 3] = alpha_output
self.save(output_img, Path(image_path).stem)
elif img.shape[2] == 3:
image_output = self.post_process(
self.inference(self.pre_process(img))
) # BGR
self.save(image_output, Path(image_path).stem)
outputs += [image_output.astype('uint8')]
return outputs
abpn_model = ABPN(abpn_model_path)
abpn_upsampled = abpn_model.upsample([str(example_image_path)])[0]
abpn_upsampled.shape
0%| | 0/1 [00:00<?, ?it/s]
(1080, 1920, 3)
Image.fromarray(abpn_upsampled)
And double check the upsampled size of the image.
# check the scale of the super-resolution image
x_scale = abpn_upsampled.shape[1] / example_image.size[0]
y_scale = abpn_upsampled.shape[0] / example_image.size[1]
(x_scale, y_scale)
(4.0, 4.0)
ESRGAN¶
We can use the implementation of Real-ESRGAN from their GitHub.
That code was written to consider many pretrained variations of this architecture.
To increase readability, we strip this code down to expect only a single model variant, the RealESRGAN_x4plus
(v0.1.0).
This can be downloaded from the Real-ESRGAN model zoo.
class ESRGAN(torch.nn.Module):
def __init__(
self,
model_name: str="realesr-general-x4v3",
model_dir: str="./",
tile=0,
tile_pad=10,
pre_pad=0,
half=False,
device=None
):
super(ESRGAN, self).__init__()
# model path and name
self.model_dir = model_dir
self.model_path = os.path.join(model_dir, model_name + '.pth')
self.model_name = model_name
self.check_model_present()
# RRDBNet parameters specific to pretrained model instance: v0.1.0/RealESRGAN_x4plus
self.model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64, num_block=23, num_grow_ch=32, scale=4)
# other model parameters
self.netscale = 4
self.tile = tile
self.tile_pad = tile_pad
self.pre_pad = pre_pad
self.half = half
# actual SR module
self.upsampler = RealESRGANer(
scale=self.netscale,
model_path=self.model_path,
model=self.model,
tile=self.tile,
tile_pad=self.tile_pad,
pre_pad=self.pre_pad,
half=self.half
)
# realesrgan tries to cast to cuda, but not mps for Mac users
if device:
self.device = torch.device(device)
self.upsampler.device = torch.device(device)
self.upsampler.model = self.upsampler.model.to(torch.device(device))
def upsample(self, image_paths: List[str]):
outputs = []
for image_path in tqdm(image_paths):
img = Image.open(image_path)
img = np.array(img)
img = self.upsampler.enhance(img)[0]  # second return value not needed; it specifies the output type ('RGB')
outputs += [img]
return outputs
def check_model_present(self):
# sanity check before proceeding
if not os.path.isfile(self.model_path):
raise ValueError(
f"Model {self.model_name} not found locally at \n" \
f"{self.model_path}. \n" \
"Download https://github.com/xinntao/Real-ESRGAN/releases/download/v0.1.0/RealESRGAN_x4plus.pth"
)
esrgan_model = ESRGAN(model_name="RealESRGAN_x4plus", model_dir=models_dir/"ESRGAN", device="mps") # mps to speed up inference on Macs
print(esrgan_model.upsampler.device)
mps
esrgan_upsampled = esrgan_model.upsample([example_image_path])[0]
print(esrgan_upsampled.shape)
Image.fromarray(esrgan_upsampled)
0%| | 0/1 [00:00<?, ?it/s]
(1080, 1920, 3)
HAT: Hybrid Attention Transformer for Image Restoration¶
Our implementation of the HAT model is basically just a wrapper on top of the HAT module from the project repository. The wrapper allows us to call the model in a similar fashion to our other SR model implementations.
class Hat(torch.nn.Module):
"""
Config for the pretrained instance we are using found at:
https://github.com/XPixelGroup/HAT/blob/main/options/test/HAT_SRx4_ImageNet-pretrain.yml
"""
def __init__(
self,
weight_path: str = "HAT_SRx4_ImageNet-pretrain.pth",
upscale = 4,
in_chans = 3,
img_size = 64,
window_size = 16,
compress_ratio = 3,
squeeze_factor = 30,
conv_scale = 0.01,
overlap_ratio = 0.5,
img_range = 1.,
depths = [6, 6, 6, 6, 6, 6],
embed_dim = 180,
num_heads = [6, 6, 6, 6, 6, 6],
mlp_ratio = 2,
upsampler = 'pixelshuffle',
resi_connection = '1conv',
grad=False,
verbose=False,
device=None,
):
super(Hat, self).__init__()
self.model = HAT(
upscale = upscale,
in_chans = in_chans,
img_size = img_size,
window_size = window_size,
compress_ratio = compress_ratio,
squeeze_factor = squeeze_factor,
conv_scale = conv_scale,
overlap_ratio = overlap_ratio,
img_range = img_range,
depths = depths,
embed_dim = embed_dim,
num_heads = num_heads,
mlp_ratio = mlp_ratio,
upsampler = upsampler,
resi_connection = resi_connection,
)
self.model.load_state_dict(torch.load(weight_path)['params_ema'])
# cast to device
if device:
self.model.to(torch.device(device))
self.device = device
else:
self.device = self.model.device
self.no_grad() if not grad else None
self.verbose = verbose
def set_device(self, device):
self.model.to(torch.device(device))
self.device = device
def no_grad(self):
self.model.eval()
for param in self.model.parameters():
param.requires_grad = False
def crop_image(self, image, size):
return ImageOps.fit(image, size, Image.LANCZOS)
def resize_image(self, image, size):
# Get the size of the current image
old_size = image.size
# Calculate the ratio of the new size and the old size
ratio = min(float(size[i]) / float(old_size[i]) for i in range(len(size)))
# Calculate the new size
new_size = tuple([int(i*ratio) for i in old_size])
# Resize the image
image = image.resize(new_size, Image.LANCZOS)
# Create a new image with the specified size and fill it with white color
new_image = Image.new("RGB", size, "white")
# Calculate the position to paste the resized image
position = ((size[0] - new_size[0]) // 2, (size[1] - new_size[1]) // 2)
# Paste the resized image to the new image
new_image.paste(image, position)
return new_image
def upsample(self, image_paths: List[str]):
outputs = []
for image_path in tqdm(image_paths):
# load image
img = Image.open(image_path)
img_shape = np.array(img).shape
# crop image to size w/ factor of 16
input_size = img_shape[0] - (img_shape[0] % 16)
cropped_img = self.crop_image(img, (input_size, input_size))
display(cropped_img) if self.verbose else None
# prep image dimension order
input_img = torch.tensor(np.array(cropped_img)).to(self.device).permute(2, 0, 1)
# feed to model
output_tensor = self.model.forward(input_img)
# post process to maintain aspect ratio, ensuring labels are still accurate
output_array = output_tensor.squeeze(0).permute(1, 2, 0).cpu().numpy()
output_img = Image.fromarray((output_array).astype(np.uint8)).convert('RGB')
scaled_output_size = (img_shape[1]*self.model.upscale, img_shape[0]*self.model.upscale)
img = self.resize_image(output_img, scaled_output_size)
outputs += [np.array(img)]
return outputs
hat_model = Hat(models_dir / "HAT" / "HAT_SRx4_ImageNet-pretrain.pth", device="mps")
hat_upsampled = hat_model.upsample([example_image_path])
Image.fromarray(hat_upsampled[0])
0%| | 0/1 [00:00<?, ?it/s]
This may not have been the best instance of the HAT model. During development, we found that expected input sizes were quite small and needed to be square, meaning inputs would need some preprocessing. The cropping of inputs and resizing of outputs might have contributed to the subjectively poor super-resolution performance of the HAT model on our example image. By this, we are referring to the lime-green artifacts that appear in the output image, which are not present in the input image.
We will need to look into calibrating this model further. One option here could be using a different instance of the model, which would require a new set of config parameters. As such research may be quite time-consuming, we will keep the current implementation and use it as a starting point for future research.
Single SR image to Benthic Object Detector¶
ABPN¶
example_detections = benthic_model._model(example_image)
abpn_detections = benthic_model._model(abpn_upsampled)
example_detections.show()
abpn_detections.show()
ESRGAN¶
example_detections = benthic_model._model(example_image)
esrgan_detections = benthic_model._model(esrgan_upsampled)
example_detections.show()
esrgan_detections.show()
Here we really see what we are trying to achieve with this super-resolution layer. Look at the three new labels, one with quite high confidence, that have now been found by the benthic model.
HAT¶
example_detections = benthic_model._model(example_image)
hat_detections = benthic_model._model(hat_upsampled)
example_detections.show()
hat_detections.show()
So far, it looks like our ESRGAN model is the best performing model. This was one of our beefier models, so it is expected that it would perform better than the light-weight ABPN model. It is surprising to see that the HAT model performs so poorly on our randomly chosen example. As mentioned before, we'll keep it as is for now, and look into it further in future research.
Build prediction pipeline¶
abpn_model_path
PosixPath('/Users/per.morten.halvorsen@schibsted.com/personal/models/sr_mobile_python/models_modelx4.ort')
benthic_model_weights_path
PosixPath('/Users/per.morten.halvorsen@schibsted.com/personal/models/fathomnet_benthic/mbari-mb-benthic-33k.pt')
class YOLOv5ModelWithUpsample(YOLOv5Model, torch.nn.Module):
def __init__(
self,
detection_model_path: str = benthic_model_weights_path,
upsample_model: Union[ABPN, ESRGAN, Hat, None] = None
):
super().__init__(detection_model_path)
self.upsample_model = upsample_model
def forward(self, X: List[str]):
if self.upsample_model:
X = self.upsample_model.upsample(X)
return self._model(X)
abpn_pipeline = YOLOv5ModelWithUpsample(benthic_model_weights_path, abpn_model)
abpn_detections = abpn_pipeline.forward([str(example_image_path)]) # upsample expects a list of image paths
abpn_detections.show()
Using cache found in /Users/per.morten.halvorsen@schibsted.com/.cache/torch/hub/ultralytics_yolov5_master YOLOv5 🚀 2024-3-16 Python-3.11.5 torch-2.2.1 CPU Fusing layers... Model summary: 476 layers, 91841704 parameters, 0 gradients Adding AutoShape...
0%| | 0/1 [00:00<?, ?it/s]
esrgan_pipeline = YOLOv5ModelWithUpsample(benthic_model_weights_path, esrgan_model)
esrgan_detections = esrgan_pipeline.forward([str(example_image_path)]) # upsample expects a list of image paths
esrgan_detections.show()
Using cache found in /Users/per.morten.halvorsen@schibsted.com/.cache/torch/hub/ultralytics_yolov5_master YOLOv5 🚀 2024-3-16 Python-3.11.5 torch-2.2.1 CPU Fusing layers... Model summary: 476 layers, 91841704 parameters, 0 gradients Adding AutoShape...
0%| | 0/1 [00:00<?, ?it/s]
hat_pipeline = YOLOv5ModelWithUpsample(benthic_model_weights_path, hat_model)
hat_detections = hat_pipeline.forward([str(example_image_path)]) # upsample expects a list of image paths
hat_detections.show()
Using cache found in /Users/per.morten.halvorsen@schibsted.com/.cache/torch/hub/ultralytics_yolov5_master YOLOv5 🚀 2024-3-16 Python-3.11.5 torch-2.2.1 CPU Fusing layers... Model summary: 476 layers, 91841704 parameters, 0 gradients Adding AutoShape...
0%| | 0/1 [00:00<?, ?it/s]
Here, we'll need to add a hacky fix to make sure the call methods of the two models are the same. This will help standardize our evaluation setup later on.
def forward(self, X: List[str]):
return self._model(X)
benthic_model.forward = forward.__get__(benthic_model)
example_detections = benthic_model.forward([str(example_image_path)])
example_detections.show()
Full category classifications¶
As a sanity check, let us see if we can produce predictions for a larger number of images. Here, we'll reuse the starfish images loaded earlier, taking just the first few.
N = 5
raw_starfish_detections = benthic_model.forward(starfish_images[:N])
# raw_starfish_detections.show()
abpn_starfish_detections = abpn_pipeline.forward(starfish_images[:N])
# abpn_starfish_detections.show()
0%| | 0/5 [00:00<?, ?it/s]
esrgan_starfish_detections = esrgan_pipeline.forward(starfish_images[:N])
# esrgan_starfish_detections.show()
0%| | 0/5 [00:00<?, ?it/s]
hat_starfish_detections = hat_pipeline.forward(starfish_images[:N])
# hat_starfish_detections.show()
0%| | 0/5 [00:00<?, ?it/s]
Great! Now we can easily feed the TrashCAN dataset through all of our super-resolution models and then through the MBARI model. It's time to move on to model evaluation.
Evaluation¶
Our evaluation will contain three main steps:
- Make use of mappings and evaluation method from our previous notebook.
- Evaluate both the benthic_model and the upscaler_model.
- Compare the results of the two models.
# rebuild some needed params locally
trashcan_ids = {
row["supercategory"]: id
for id, row in trashcan_data.cats.items()
}
# find trash index
trash_idx = list(benthic_model._model.names.values()).index("trash")
print(benthic_model._model.names[trash_idx])
# find trash labels
trashcan_trash_labels = {
id: name
for name, id in trashcan_ids.items()
if name.startswith("trash")
}
trashcan_trash_labels
trash
{9: 'trash_etc', 10: 'trash_fabric', 11: 'trash_fishing_gear', 12: 'trash_metal', 13: 'trash_paper', 14: 'trash_plastic', 15: 'trash_rubber', 16: 'trash_wood'}
# replace str keys with ints
benthic2trashcan_ids = {
int(key): value
for key, value in benthic2trashcan_ids.items()
}
Run evaluation¶
To evaluate the models, we reuse some of the functions from the previous notebook.
Specifically, we will use src.evaluation.evaluate_model
.
raw_starfish_metrics = evaluate_model(
category="animal_starfish",
data=trashcan_data,
model=benthic_model,
id_map=benthic2trashcan_ids,
one_idx=trash_idx,
many_idx=trashcan_trash_labels,
exclude_ids=[trashcan_ids["rov"], trashcan_ids["plant"]],
path_prefix=data_dir / "dataset" / "material_version" / "val"
)
raw_starfish_metrics["time"]
Precision: 0.37209301460248806 Recall: 0.07920792039996079 Average IoU: tensor(0.29560)
46.661787033081055
abpn_starfish_metrics = evaluate_model(
category="animal_starfish",
data=trashcan_data,
model=abpn_pipeline,
id_map=benthic2trashcan_ids,
one_idx=trash_idx,
many_idx=trashcan_trash_labels,
exclude_ids=[trashcan_ids["rov"], trashcan_ids["plant"]],
path_prefix=data_dir / "dataset" / "material_version" / "val",
x_scale=4, # TODO define variable
y_scale=4
)
abpn_starfish_metrics["time"]
0%| | 0/46 [00:00<?, ?it/s]
Precision: 0.20312499682617194 Recall: 0.06435643532496814 Average IoU: tensor(0.15016)
52.08669114112854
esrgan_starfish_metrics = evaluate_model(
category="animal_starfish",
data=trashcan_data,
model=esrgan_pipeline,
id_map=benthic2trashcan_ids,
one_idx=trash_idx,
many_idx=trashcan_trash_labels,
exclude_ids=[trashcan_ids["rov"], trashcan_ids["plant"]],
path_prefix=data_dir / "dataset" / "material_version" / "val",
x_scale=4, # TODO define variable
y_scale=4
)
esrgan_starfish_metrics["time"]
0%| | 0/46 [00:00<?, ?it/s]
Precision: 0.2142857117346939 Recall: 0.08910891044995589 Average IoU: tensor(0.17836)
108.11618709564209
hat_starfish_metrics = evaluate_model(
category="animal_starfish",
data=trashcan_data,
model=hat_pipeline,
id_map=benthic2trashcan_ids,
one_idx=trash_idx,
many_idx=trashcan_trash_labels,
exclude_ids=[trashcan_ids["rov"], trashcan_ids["plant"]],
path_prefix=data_dir / "dataset" / "material_version" / "val",
x_scale=4, # TODO define variable
y_scale=4
)
hat_starfish_metrics["time"]
0%| | 0/46 [00:00<?, ?it/s]
Precision: 0.43478259924385654 Recall: 0.099009900499951 Average IoU: tensor(0.34594)
377.19130969047546
Woah! The HAT model was the only model to actually improve the performance of the benthic model on the starfish class. This is only a single category, but it is a very interesting insight. During implementation, the outputs from the HAT model seemed quite poor. This is a great example of how a model's measured performance can differ from what you expect.
Let's check out the other categories to see if we see similar results.
Metrics for all categories¶
def evaluate(model, category, name="", N=20):
# profiler allows us to check the memory consumption
with profile(activities=[ProfilerActivity.CPU], profile_memory=True) as prof:
print()
metrics = evaluate_model(
category=category,
data=trashcan_data,
model=model,
id_map=benthic2trashcan_ids,
N=N,
one_idx=trash_idx,
many_idx=trashcan_trash_labels,
exclude_ids=[trashcan_ids["rov"], trashcan_ids["plant"]],
path_prefix=data_dir / "dataset" / "material_version" / "val",
x_scale=4, # TODO define variable
y_scale=4
)
print(name.upper(), "Model")
print()
print(prof.key_averages().table(sort_by="self_cpu_memory_usage", row_limit=5))
return metrics
Fish¶
raw_fish_metrics = evaluate(benthic_model, "animal_fish", "benthic")
abpn_fish_metrics = evaluate(abpn_pipeline, "animal_fish", "abpn")
esrgan_fish_metrics = evaluate(esrgan_pipeline, "animal_fish", "esrgan")
hat_fish_metrics = evaluate(hat_pipeline, "animal_fish", "hat")
STAGE:2024-03-11 23:01:22 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 BENTHIC Model
STAGE:2024-03-11 23:01:48 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:01:48 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 796.000us 0.00% 796.000us 2.449us 8.49 Gb 8.49 Gb 325 aten::cat 0.50% 126.437ms 0.50% 126.636ms 4.367ms 3.20 Gb 3.20 Gb 29 aten::add 0.23% 58.814ms 0.23% 58.841ms 486.289us 1.49 Gb 1.49 Gb 121 aten::sigmoid 0.34% 85.547ms 0.34% 85.547ms 28.516ms 1003.60 Mb 1003.60 Mb 3 aten::max_pool2d_with_indices 1.55% 396.735ms 1.55% 396.735ms 132.245ms 131.84 Mb 131.84 Mb 3 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 25.514s
STAGE:2024-03-11 23:01:48 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.33333327777778704 Recall: 0.03389830451019823 Average IoU: tensor(0.26626) ABPN Model
STAGE:2024-03-11 23:02:16 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:02:16 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 741.000us 0.00% 741.000us 2.352us 8.54 Gb 8.54 Gb 315 aten::cat 0.92% 237.498ms 0.92% 237.749ms 10.337ms 3.20 Gb 3.20 Gb 23 aten::add 0.21% 54.901ms 0.21% 54.962ms 495.153us 1.49 Gb 1.49 Gb 111 aten::sigmoid 0.36% 92.160ms 0.36% 92.160ms 30.720ms 1003.60 Mb 1003.60 Mb 3 aten::max_pool2d_with_indices 1.53% 395.412ms 1.53% 395.412ms 131.804ms 131.84 Mb 131.84 Mb 3 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 25.921s
STAGE:2024-03-11 23:02:17 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.16666665277777895 Recall: 0.03389830451019823 Average IoU: tensor(0.13541) ESRGAN Model
STAGE:2024-03-11 23:03:10 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:03:10 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.05% 24.961ms 0.05% 24.961ms 3.362us 8.34 Gb 8.34 Gb 7424 aten::cat 13.67% 7.148s 13.67% 7.148s 1.287ms 3.20 Gb 3.20 Gb 5554 aten::add 1.45% 759.308ms 1.45% 759.372ms 374.999us 1.49 Gb 1.49 Gb 2025 aten::sigmoid 0.19% 98.839ms 0.19% 98.839ms 32.946ms 1003.60 Mb 1003.60 Mb 3 aten::empty_strided 0.00% 777.000us 0.00% 777.000us 1.165us 544.93 Mb 544.93 Mb 667 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 52.282s
STAGE:2024-03-11 23:03:14 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.49999991666668053 Recall: 0.050847456765297346 Average IoU: tensor(0.38517) HAT Model
STAGE:2024-03-11 23:05:46 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:05:46 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.02% 31.508ms 0.02% 31.508ms 1.050us 24.00 Gb 24.00 Gb 30003 aten::resize_ 3.43% 5.181s 3.43% 5.181s 39.857ms 15.53 Gb 15.53 Gb 130 aten::empty_strided 0.00% 4.210ms 0.00% 4.210ms 5.249us 11.99 Gb 11.99 Gb 802 aten::cat 3.67% 5.544s 3.67% 5.546s 3.493ms 3.20 Gb 3.20 Gb 1588 aten::add 3.52% 5.316s 3.53% 5.334s 1.373ms 1.49 Gb 1.49 Gb 3884 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 151.136s
Crab¶
raw_crab_metrics = evaluate(benthic_model, "animal_crab", "benthic")
abpn_crab_metrics = evaluate(abpn_pipeline, "animal_crab", "abpn")
esrgan_crab_metrics = evaluate(esrgan_pipeline, "animal_crab", "esrgan")
hat_crab_metrics = evaluate(hat_pipeline, "animal_crab", "hat")
STAGE:2024-03-11 23:05:55 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 BENTHIC Model
STAGE:2024-03-11 23:06:21 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:06:21 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 707.000us 0.00% 707.000us 1.704us 8.54 Gb 8.54 Gb 415 aten::cat 2.78% 710.329ms 2.78% 710.547ms 20.898ms 3.20 Gb 3.20 Gb 34 aten::add 0.20% 51.887ms 0.20% 52.080ms 186.000us 1.49 Gb 1.49 Gb 280 aten::sigmoid 0.41% 105.032ms 0.41% 105.032ms 35.011ms 1003.60 Mb 1003.60 Mb 3 aten::max_pool2d_with_indices 1.50% 384.054ms 1.50% 384.054ms 128.018ms 131.84 Mb 131.84 Mb 3 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 25.533s
STAGE:2024-03-11 23:06:23 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.013333333155555559 Recall: 0.01149425274144537 Average IoU: tensor(0.01037) ABPN Model
STAGE:2024-03-11 23:06:50 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:06:50 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 725.000us 0.00% 725.000us 1.959us 8.54 Gb 8.54 Gb 370 aten::cat 1.26% 324.732ms 1.26% 324.930ms 11.204ms 3.20 Gb 3.20 Gb 29 aten::add 0.22% 56.119ms 0.22% 56.607ms 112.093us 1.49 Gb 1.49 Gb 505 aten::sigmoid 0.44% 113.767ms 0.44% 113.767ms 37.922ms 1003.60 Mb 1003.60 Mb 3 aten::max_pool2d_with_indices 1.49% 382.600ms 1.49% 382.600ms 127.533ms 131.84 Mb 131.84 Mb 3 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 25.694s
STAGE:2024-03-11 23:06:53 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.008695652098298678 Recall: 0.01149425274144537 Average IoU: tensor(0.00913) ESRGAN Model
STAGE:2024-03-11 23:07:49 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:07:49 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.05% 29.082ms 0.05% 29.082ms 3.925us 8.54 Gb 8.54 Gb 7410 aten::cat 17.21% 9.378s 17.21% 9.378s 1.690ms 3.20 Gb 3.20 Gb 5549 aten::add 2.54% 1.385s 2.54% 1.386s 497.175us 1.49 Gb 1.49 Gb 2787 aten::sigmoid 0.19% 101.354ms 0.19% 101.354ms 33.785ms 1003.60 Mb 1003.60 Mb 3 aten::empty_strided 0.00% 625.000us 0.00% 625.000us 0.080us 576.61 Mb 576.61 Mb 7814 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 54.499s
STAGE:2024-03-11 23:07:56 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.11111110493827195 Recall: 0.02298850548289074 Average IoU: tensor(0.10181) HAT Model
STAGE:2024-03-11 23:10:44 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:10:44 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.03% 42.097ms 0.03% 42.097ms 1.401us 26.07 Gb 26.07 Gb 30055 aten::resize_ 3.34% 5.575s 3.34% 5.575s 39.263ms 17.88 Gb 17.88 Gb 142 aten::empty_strided 0.00% 4.375ms 0.00% 4.375ms 2.587us 13.63 Gb 13.63 Gb 1691 aten::cat 3.83% 6.399s 3.84% 6.401s 4.028ms 3.20 Gb 3.20 Gb 1589 aten::sub 0.12% 202.018ms 0.12% 202.514ms 373.642us 1.70 Gb 1.70 Gb 542 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 166.854s
Eel¶
raw_eel_metrics = evaluate(benthic_model, "animal_eel", "benthic")
abpn_eel_metrics = evaluate(abpn_pipeline, "animal_eel", "abpn")
esrgan_eel_metrics = evaluate(esrgan_pipeline, "animal_eel", "esrgan")
hat_eel_metrics = evaluate(hat_pipeline, "animal_eel", "hat")
STAGE:2024-03-11 23:29:59 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up [W CPUAllocator.cpp:235] Memory block of unknown size was allocated before the profiling started, profiler results will not include the deallocation event
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 BENTHIC Model
STAGE:2024-03-11 23:30:21 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:30:21 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 752.000us 0.00% 752.000us 2.173us 6.95 Gb 6.95 Gb 346 aten::cat 5.80% 1.248s 5.80% 1.249s 35.675ms 2.56 Gb 2.56 Gb 35 aten::add 0.19% 41.607ms 0.19% 41.632ms 315.394us 1.19 Gb 1.19 Gb 132 aten::sigmoid 0.38% 82.467ms 0.38% 82.467ms 27.489ms 802.88 Mb 802.88 Mb 3 aten::max_pool2d_with_indices 1.36% 293.307ms 1.36% 293.307ms 97.769ms 105.47 Mb 105.47 Mb 3 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 21.522s
STAGE:2024-03-11 23:30:22 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 ABPN Model
STAGE:2024-03-11 23:30:45 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:30:45 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 792.000us 0.00% 792.000us 2.336us 6.95 Gb 6.95 Gb 339 aten::cat 1.11% 237.958ms 1.11% 238.214ms 8.214ms 2.56 Gb 2.56 Gb 29 aten::add 0.19% 40.676ms 0.19% 40.703ms 357.044us 1.19 Gb 1.19 Gb 114 aten::sigmoid 0.49% 105.003ms 0.49% 105.003ms 35.001ms 802.88 Mb 802.88 Mb 3 aten::empty_like 0.00% 33.000us 0.00% 104.000us 2.419us 978.66 Mb 152.93 Mb 43 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 21.427s
STAGE:2024-03-11 23:30:46 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.2857142653061239 Recall: 0.08333333159722227 Average IoU: tensor(0.21974) ESRGAN Model
STAGE:2024-03-11 23:31:33 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:31:33 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.05% 23.116ms 0.05% 23.116ms 3.120us 6.95 Gb 6.95 Gb 7408 aten::cat 13.39% 6.148s 13.39% 6.148s 1.107ms 2.56 Gb 2.56 Gb 5555 aten::add 0.38% 175.796ms 0.38% 175.854ms 87.316us 1.19 Gb 1.19 Gb 2014 aten::sigmoid 0.21% 94.995ms 0.21% 94.995ms 31.665ms 802.88 Mb 802.88 Mb 3 aten::empty_strided 0.00% 674.000us 0.00% 674.000us 1.127us 530.86 Mb 530.86 Mb 598 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 45.908s
STAGE:2024-03-11 23:31:36 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.3636363305785154 Recall: 0.08333333159722227 Average IoU: tensor(0.27386) HAT Model
STAGE:2024-03-11 23:33:31 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:33:31 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.02% 27.413ms 0.02% 27.413ms 0.913us 20.02 Gb 20.02 Gb 30034 aten::resize_ 2.87% 3.277s 2.87% 3.277s 23.080ms 13.18 Gb 13.18 Gb 142 aten::empty_strided 0.00% 4.253ms 0.00% 4.253ms 4.911us 10.35 Gb 10.35 Gb 866 aten::cat 1.06% 1.208s 1.06% 1.209s 758.708us 2.56 Gb 2.56 Gb 1594 aten::sub 0.07% 77.775ms 0.07% 78.057ms 369.938us 1.25 Gb 1.25 Gb 211 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 114.019s
Shells¶
raw_shell_metrics = evaluate(benthic_model, "animal_shell", "benthic")
abpn_shell_metrics = evaluate(abpn_pipeline, "animal_shell", "abpn")
esrgan_shell_metrics = evaluate(esrgan_pipeline, "animal_shell", "esrgan")
hat_shell_metrics = evaluate(hat_pipeline, "animal_shell", "hat")
STAGE:2024-03-11 23:10:55 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 BENTHIC Model
STAGE:2024-03-11 23:11:21 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:11:21 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing STAGE:2024-03-11 23:11:21 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 722.000us 0.00% 722.000us 2.337us 8.35 Gb 8.35 Gb 309 aten::cat 3.30% 843.995ms 3.30% 844.226ms 31.268ms 3.20 Gb 3.20 Gb 27 aten::add 0.20% 51.719ms 0.20% 51.725ms 533.247us 1.49 Gb 1.49 Gb 97 aten::sigmoid 0.39% 99.917ms 0.39% 99.917ms 33.306ms 1003.60 Mb 1003.60 Mb 3 aten::empty_like 0.00% 26.000us 0.00% 60.000us 2.069us 1.05 Gb 238.95 Mb 29 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 25.552s
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 ABPN Model
STAGE:2024-03-11 23:11:49 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:11:49 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.00% 717.000us 0.00% 717.000us 2.328us 8.54 Gb 8.54 Gb 308 aten::cat 1.04% 270.200ms 1.04% 270.423ms 10.401ms 3.20 Gb 3.20 Gb 26 aten::add 0.21% 55.376ms 0.21% 55.462ms 338.183us 1.49 Gb 1.49 Gb 164 aten::sigmoid 0.45% 117.408ms 0.45% 117.408ms 39.136ms 1003.60 Mb 1003.60 Mb 3 aten::max_pool2d_with_indices 1.48% 385.957ms 1.48% 385.957ms 128.652ms 131.84 Mb 131.84 Mb 3 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 26.001s
STAGE:2024-03-11 23:11:49 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 ESRGAN Model
STAGE:2024-03-11 23:12:43 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:12:43 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.06% 30.364ms 0.06% 30.364ms 4.127us 8.54 Gb 8.54 Gb 7357 aten::cat 13.63% 7.187s 13.63% 7.187s 1.296ms 3.20 Gb 3.20 Gb 5546 aten::add 1.23% 648.459ms 1.23% 648.471ms 330.515us 1.49 Gb 1.49 Gb 1962 aten::sigmoid 0.20% 105.889ms 0.20% 105.889ms 35.296ms 1003.60 Mb 1003.60 Mb 3 aten::empty_strided 0.00% 651.000us 0.00% 651.000us 1.674us 544.92 Mb 544.92 Mb 389 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 52.715s
STAGE:2024-03-11 23:12:47 30539:143864 ActivityProfilerController.cpp:314] Completed Stage: Warm Up
0%| | 0/20 [00:00<?, ?it/s]
Precision: 0.0 Recall: 0.0 Average IoU: 0.0 HAT Model
STAGE:2024-03-11 23:15:18 30539:143864 ActivityProfilerController.cpp:320] Completed Stage: Collection STAGE:2024-03-11 23:15:18 30539:143864 ActivityProfilerController.cpp:324] Completed Stage: Post Processing
------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Name Self CPU % Self CPU CPU total % CPU total CPU time avg CPU Mem Self CPU Mem # of Calls ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ aten::empty 0.02% 29.626ms 0.02% 29.626ms 0.989us 23.55 Gb 23.55 Gb 29953 aten::resize_ 3.61% 5.430s 3.61% 5.430s 44.506ms 14.94 Gb 14.94 Gb 122 aten::empty_strided 0.00% 4.174ms 0.00% 4.174ms 7.414us 11.42 Gb 11.42 Gb 563 aten::cat 3.47% 5.208s 3.47% 5.210s 3.295ms 3.20 Gb 3.20 Gb 1581 aten::add 3.42% 5.140s 3.43% 5.157s 1.343ms 1.49 Gb 1.49 Gb 3839 ------------------------------------- ------------ ------------ ------------ ------------ ------------ ------------ ------------ ------------ Self CPU time total: 150.234s
Trash¶
raw_trash_metrics = evaluate(benthic_model, "trash_plastic", "benthic")
abpn_trash_metrics = evaluate(abpn_pipeline, "trash_plastic", "abpn")
esrgan_trash_metrics = evaluate(esrgan_pipeline, "trash_plastic", "esrgan")
hat_trash_metrics = evaluate(hat_pipeline, "trash_plastic", "hat")
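The `evaluate` helper was defined earlier in the notebook; conceptually, it wraps each inference run in PyTorch's profiler, which is where the timing and memory tables below come from. A minimal sketch of that wrapper, with illustrative names (an assumption, not the exact implementation):

```python
# Minimal sketch of the profiling wrapper inside `evaluate` (illustrative
# names; the real helper is defined earlier in the notebook).
from torch.profiler import profile, record_function, ProfilerActivity

def profiled_inference(model, images):
    """Run `model` over `images` while recording CPU time and memory."""
    with profile(
        activities=[ProfilerActivity.CPU],  # CPU-only, matching this notebook's runs
        profile_memory=True,                # required for the CPU Mem columns
    ) as prof:
        with record_function("model_inference"):
            predictions = [model(image) for image in images]
    # Sorting by self memory usage with a 5-row limit reproduces the shape
    # of the tables printed below.
    print(prof.key_averages().table(sort_by="self_cpu_memory_usage", row_limit=5))
    return predictions
```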
BENTHIC Model
Precision: 0.0 Recall: 0.0 Average IoU: 0.0

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.00% | 672.000us | 0.00% | 672.000us | 2.161us | 8.54 Gb | 8.54 Gb | 311 |
aten::cat | 1.70% | 432.191ms | 1.70% | 432.402ms | 18.017ms | 3.20 Gb | 3.20 Gb | 24 |
aten::add | 0.20% | 50.950ms | 0.20% | 50.975ms | 485.476us | 1.49 Gb | 1.49 Gb | 105 |
aten::sigmoid | 0.39% | 99.362ms | 0.39% | 99.362ms | 33.121ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::empty_like | 0.00% | 54.000us | 0.00% | 69.000us | 2.556us | 1.05 Gb | 764.65 Mb | 27 |

Self CPU time total: 25.423s

ABPN Model
Precision: 0.035714284438775556 Recall: 0.014084506843880186 Average IoU: tensor(0.02660)

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.00% | 765.000us | 0.00% | 765.000us | 2.243us | 8.51 Gb | 8.51 Gb | 341 |
aten::cat | 1.22% | 320.818ms | 1.22% | 321.030ms | 11.890ms | 3.20 Gb | 3.20 Gb | 27 |
aten::add | 0.20% | 53.035ms | 0.20% | 53.274ms | 189.587us | 1.49 Gb | 1.49 Gb | 281 |
aten::sigmoid | 0.38% | 99.780ms | 0.38% | 99.780ms | 33.260ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::empty_like | 0.00% | 58.000us | 0.00% | 73.000us | 1.780us | 1.00 Gb | 955.81 Mb | 41 |

Self CPU time total: 26.403s

ESRGAN Model
Precision: 0.24999993750001562 Recall: 0.014084506843880186 Average IoU: tensor(0.18600)

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.06% | 30.510ms | 0.06% | 30.510ms | 4.156us | 8.53 Gb | 8.53 Gb | 7341 |
aten::cat | 14.51% | 7.936s | 14.51% | 7.936s | 1.432ms | 3.20 Gb | 3.20 Gb | 5543 |
aten::add | 1.96% | 1.072s | 1.96% | 1.072s | 547.347us | 1.49 Gb | 1.49 Gb | 1959 |
aten::sigmoid | 0.16% | 87.453ms | 0.16% | 87.453ms | 29.151ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::empty_strided | 0.00% | 737.000us | 0.00% | 737.000us | 2.200us | 473.73 Mb | 473.73 Mb | 335 |

Self CPU time total: 54.684s

HAT Model
Precision: 0.285714244897965 Recall: 0.028169013687760373 Average IoU: tensor(0.20661)

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.02% | 36.968ms | 0.02% | 36.968ms | 1.232us | 25.19 Gb | 25.19 Gb | 29995 |
aten::resize_ | 3.50% | 5.330s | 3.50% | 5.330s | 41.002ms | 16.71 Gb | 16.71 Gb | 130 |
aten::empty_strided | 0.00% | 4.261ms | 0.00% | 4.261ms | 4.688us | 12.21 Gb | 12.21 Gb | 909 |
aten::cat | 3.97% | 6.033s | 3.97% | 6.035s | 3.810ms | 3.20 Gb | 3.20 Gb | 1584 |
aten::sub | 0.05% | 70.755ms | 0.05% | 71.011ms | 298.366us | 1.58 Gb | 1.58 Gb | 238 |

Self CPU time total: 152.132s
Metal¶
raw_metal_metrics = evaluate(benthic_model, "trash_metal", "benthic")
abpn_metal_metrics = evaluate(abpn_pipeline, "trash_metal", "abpn")
esrgan_metal_metrics = evaluate(esrgan_pipeline, "trash_metal", "esrgan")
hat_metal_metrics = evaluate(hat_pipeline, "trash_metal", "hat")
BENTHIC Model
Precision: 0.0 Recall: 0.0 Average IoU: 0.0

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.00% | 671.000us | 0.00% | 671.000us | 1.997us | 8.54 Gb | 8.54 Gb | 336 |
aten::cat | 3.65% | 950.446ms | 3.65% | 950.676ms | 35.210ms | 3.20 Gb | 3.20 Gb | 27 |
aten::add | 0.20% | 51.024ms | 0.20% | 51.102ms | 313.509us | 1.49 Gb | 1.49 Gb | 163 |
aten::sigmoid | 0.38% | 97.993ms | 0.38% | 97.993ms | 32.664ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::max_pool2d_with_indices | 1.48% | 386.081ms | 1.48% | 386.081ms | 128.694ms | 131.84 Mb | 131.84 Mb | 3 |

Self CPU time total: 26.074s

ABPN Model
Precision: 0.0 Recall: 0.0 Average IoU: 0.0

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.00% | 734.000us | 0.00% | 734.000us | 2.128us | 8.54 Gb | 8.54 Gb | 345 |
aten::cat | 0.78% | 200.175ms | 0.78% | 200.389ms | 7.422ms | 3.20 Gb | 3.20 Gb | 27 |
aten::add | 0.22% | 55.845ms | 0.22% | 56.055ms | 219.824us | 1.49 Gb | 1.49 Gb | 255 |
aten::sigmoid | 0.45% | 116.273ms | 0.45% | 116.273ms | 38.758ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::max_pool2d_with_indices | 1.50% | 385.711ms | 1.50% | 385.711ms | 128.570ms | 131.84 Mb | 131.84 Mb | 3 |

Self CPU time total: 25.660s

ESRGAN Model
Precision: 0.0 Recall: 0.0 Average IoU: 0.0

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.06% | 29.801ms | 0.06% | 29.801ms | 4.067us | 8.35 Gb | 8.35 Gb | 7327 |
aten::cat | 14.34% | 7.590s | 14.34% | 7.590s | 1.369ms | 3.20 Gb | 3.20 Gb | 5543 |
aten::add | 1.24% | 656.848ms | 1.24% | 656.954ms | 324.422us | 1.49 Gb | 1.49 Gb | 2025 |
aten::sigmoid | 0.18% | 94.047ms | 0.18% | 94.047ms | 31.349ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::empty_strided | 0.00% | 658.000us | 0.00% | 658.000us | 0.532us | 505.38 Mb | 505.38 Mb | 1238 |

Self CPU time total: 52.927s

HAT Model
Precision: 0.199999960000008 Recall: 0.01612903199791884 Average IoU: tensor(0.16952)

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.02% | 30.678ms | 0.02% | 30.678ms | 1.023us | 23.48 Gb | 23.48 Gb | 30001 |
aten::resize_ | 3.22% | 4.618s | 3.22% | 4.618s | 35.522ms | 14.94 Gb | 14.94 Gb | 130 |
aten::empty_strided | 0.00% | 4.067ms | 0.00% | 4.067ms | 5.201us | 11.26 Gb | 11.26 Gb | 782 |
aten::cat | 3.47% | 4.972s | 3.47% | 4.974s | 3.138ms | 3.20 Gb | 3.20 Gb | 1585 |
aten::add | 3.73% | 5.343s | 3.74% | 5.360s | 1.384ms | 1.49 Gb | 1.49 Gb | 3874 |

Self CPU time total: 143.194s
Wood¶
raw_wood_metrics = evaluate(benthic_model, "trash_wood", "benthic")
abpn_wood_metrics = evaluate(abpn_pipeline, "trash_wood", "abpn")
esrgan_wood_metrics = evaluate(esrgan_pipeline, "trash_wood", "esrgan")
hat_wood_metrics = evaluate(hat_pipeline, "trash_wood", "hat")
BENTHIC Model
Precision: 0.0 Recall: 0.0 Average IoU: 0.0

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.00% | 761.000us | 0.00% | 761.000us | 2.606us | 8.54 Gb | 8.54 Gb | 292 |
aten::cat | 1.48% | 373.154ms | 1.48% | 373.359ms | 16.233ms | 3.20 Gb | 3.20 Gb | 23 |
aten::add | 0.23% | 57.015ms | 0.23% | 57.020ms | 647.955us | 1.49 Gb | 1.49 Gb | 88 |
aten::sigmoid | 0.38% | 94.688ms | 0.38% | 94.688ms | 31.563ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::max_pool2d_with_indices | 1.53% | 385.242ms | 1.53% | 385.242ms | 128.414ms | 131.84 Mb | 131.84 Mb | 3 |

Self CPU time total: 25.242s

ABPN Model
Precision: 0.0 Recall: 0.0 Average IoU: 0.0

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.00% | 752.000us | 0.00% | 752.000us | 2.541us | 8.54 Gb | 8.54 Gb | 296 |
aten::cat | 1.27% | 326.029ms | 1.27% | 326.242ms | 14.184ms | 3.20 Gb | 3.20 Gb | 23 |
aten::add | 0.21% | 54.261ms | 0.21% | 54.267ms | 616.670us | 1.49 Gb | 1.49 Gb | 88 |
aten::sigmoid | 0.36% | 90.993ms | 0.36% | 90.993ms | 30.331ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::max_pool2d_with_indices | 1.50% | 382.867ms | 1.50% | 382.867ms | 127.622ms | 131.84 Mb | 131.84 Mb | 3 |

Self CPU time total: 25.588s

ESRGAN Model
Precision: 0.0 Recall: 0.0 Average IoU: tensor(0.08112)

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.06% | 35.889ms | 0.06% | 35.889ms | 4.880us | 8.48 Gb | 8.48 Gb | 7355 |
aten::cat | 19.05% | 10.780s | 19.06% | 10.780s | 1.943ms | 3.20 Gb | 3.20 Gb | 5548 |
aten::add | 3.34% | 1.889s | 3.34% | 1.889s | 960.090us | 1.49 Gb | 1.49 Gb | 1968 |
aten::sigmoid | 0.17% | 97.518ms | 0.17% | 97.518ms | 32.506ms | 1003.60 Mb | 1003.60 Mb | 3 |
aten::empty_strided | 0.00% | 647.000us | 0.00% | 647.000us | 1.875us | 482.52 Mb | 482.52 Mb | 345 |

Self CPU time total: 56.571s

HAT Model
Precision: 0.0 Recall: 0.0 Average IoU: tensor(0.09752)

Name | Self CPU % | Self CPU | CPU total % | CPU total | CPU time avg | CPU Mem | Self CPU Mem | # of Calls |
---|---|---|---|---|---|---|---|---|
aten::empty | 0.02% | 49.865ms | 0.02% | 49.865ms | 1.664us | 28.86 Gb | 28.86 Gb | 29971 |
aten::resize_ | 3.83% | 7.725s | 3.83% | 7.725s | 62.298ms | 20.23 Gb | 20.23 Gb | 124 |
aten::empty_strided | 0.00% | 4.809ms | 0.00% | 4.809ms | 7.820us | 16.05 Gb | 16.05 Gb | 615 |
aten::cat | 4.81% | 9.703s | 4.81% | 9.706s | 6.135ms | 3.20 Gb | 3.20 Gb | 1582 |
aten::sub | 0.41% | 829.572ms | 0.41% | 829.781ms | 7.543ms | 1.92 Gb | 1.92 Gb | 110 |

Self CPU time total: 201.674s
Results¶
Animal categories¶
Model | Category | Precision | Recall | Average IoU | Elapsed time | Peak memory |
---|---|---|---|---|---|---|
Basic | Crab | 0.0 | 0.00 | 0.0 | 25.53 s | 8.54 Gb |
ABPN | Crab | 0.0133 | 0.0115 | 0.0104 | 25.69 s | 8.54 Gb |
ESRGAN | Crab | 0.0087 | 0.0115 | 0.0092 | 54.50 s | 8.54 Gb |
HAT | Crab | 0.1111 | 0.0230 | 0.1018 | 166.85 s | 26.07 Gb |
Basic | Eel | 0.0 | 0.0 | 0.0 | 21.52 s | 6.95 Gb |
ABPN | Eel | 0.0 | 0.0 | 0.0 | 21.43 s | 6.95 Gb |
ESRGAN | Eel | 0.2857 | 0.0833 | 0.2197 | 45.91 s | 6.95 Gb |
HAT | Eel | 0.3636 | 0.0833 | 0.2739 | 114.02 s | 20.02 Gb |
Basic | Fish | 0.0 | 0.0 | 0.0 | 25.51 s | 8.49 Gb |
ABPN | Fish | 0.3333 | 0.0339 | 0.2662 | 25.92 s | 8.54 Gb |
ESRGAN | Fish | 0.1667 | 0.0339 | 0.1354 | 52.82 s | 8.34 Gb |
HAT | Fish | 0.5000 | 0.0508 | 0.3851 | 151.14 s | 24.00 Gb |
Basic | Shell | 0.0 | 0.0 | 0.0 | 25.55 s | 8.35 Gb |
ABPN | Shell | 0.0 | 0.0 | 0.0 | 26.00 s | 8.54 Gb |
ESRGAN | Shell | 0.0 | 0.0 | 0.0 | 52.72 s | 8.54 Gb |
HAT | Shell | 0.0 | 0.0 | 0.0 | 150.23 s | 23.55 Gb |
Basic | Starfish | 0.3720 | 0.0792 | 0.2956 | 46.45 s | - |
ABPN | Starfish | 0.2031 | 0.0643 | 0.1501 | 52.09 s | - |
ESRGAN | Starfish | 0.2142 | 0.0891 | 0.1784 | 108.12 s | - |
HAT | Starfish | 0.4347 | 0.0990 | 0.3460 | 377.19 s | - |
Trash categories¶
Model | Category | Precision | Recall | Average IoU | Elapsed time | Peak memory |
---|---|---|---|---|---|---|
Basic | Metal | 0.0 | 0.0 | 0.0 | 26.07 s | 8.54 Gb |
ABPN | Metal | 0.0 | 0.0 | 0.0 | 25.66 s | 8.54 Gb |
ESRGAN | Metal | 0.0 | 0.0 | 0.0 | 52.92 s | 8.35 Gb |
HAT | Metal | 0.2000 | 0.0161 | 0.1695 | 143.19 s | 23.48 Gb |
Basic | Trash | 0.0 | 0.0 | 0.0 | 25.42 s | 8.54 Gb |
ABPN | Trash | 0.0357 | 0.0141 | 0.0266 | 26.40 s | 8.51 Gb |
ESRGAN | Trash | 0.2500 | 0.0140 | 0.1860 | 54.68 s | 8.53 Gb |
HAT | Trash | 0.2857 | 0.0282 | 0.2066 | 152.13 s | 23.48 Gb |
Basic | Wood | 0.0 | 0.0 | 0.0 | 25.24 s | 8.54 Gb |
ABPN | Wood | 0.0 | 0.0 | 0.0 | 25.59 s | 8.54 Gb |
ESRGAN | Wood | 0.0 | 0.0 | 0.0 | 56.71 s | 8.48 Gb |
HAT | Wood | 0.0 | 0.0 | 0.0 | 201.67 s | 28.86 Gb |
Averaged metrics¶
The mean of each of our metrics across the evaluated categories.
Model | mAP | Macro average IoU | Average time | Average memory |
---|---|---|---|---|
Basic | 0.0465 | 0.0370 | 27.66 s | 8.279 Gb |
ABPN | 0.0881 | 0.0567 | 28.60 s | 8.309 Gb |
ESRGAN | 0.1157 | 0.0911 | 59.80 s | 8.247 Gb |
HAT | 0.2369 | 0.1854 | 182.05 s | 24.21 Gb |
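As a rough illustration of how these averages are aggregated (the exact bookkeeping lives in the notebook's helper code, and the metric dict layout below is an assumption), a macro average is just an unweighted mean over the per-category results:

```python
import numpy as np

def macro_average(per_category_metrics, key):
    """Unweighted mean of one metric across category-level results."""
    return float(np.mean([metrics[key] for metrics in per_category_metrics]))

# Hypothetical usage, assuming each evaluate() call returned a dict of metrics:
# hat_results = [hat_crab_metrics, hat_eel_metrics, ..., hat_wood_metrics]
# print(macro_average(hat_results, "precision"))
```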
Analysis¶
We found that our HAT pipeline performed best, or tied for best, in every category, and had the highest mAP score overall.
Categories like Fish and Eel were particularly interesting: there, the Benthic Object Detector alone did not find any of the expected labels, yet detected some of them when run behind our SR heads (ESRGAN and HAT in both cases).
This strengthens our hypothesis that model performance can be increased without any fine-tuning, simply by passing the input images through a super-resolution layer first.
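For reference, the set-up being tested is conceptually nothing more than prepending an upscaling step to the detector. The actual pipeline objects were built earlier in the notebook; this schematic sketch only shows the composition:

```python
def make_sr_pipeline(sr_model, detector):
    """Compose a super-resolution head with a detector: upscale, then detect."""
    def pipeline(image):
        upscaled = sr_model(image)  # e.g. 2x-4x super-resolution
        return detector(upscaled)   # Benthic Object Detector inference
    return pipeline

# Schematic usage (the notebook's real pipelines carry extra pre/post-processing):
# hat_pipeline = make_sr_pipeline(hat_model, benthic_model)
```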
Despite its high performance, the HAT pipeline was also the slowest of the three SR models tested, taking roughly six times as long as the basic model to process the images. It also required up to about three times the peak memory. This computational burden limits the applicability of the HAT model in real-time settings unless a GPU is available. The large jumps in performance, however, open up the possibility of digging further into more lightweight transformer models, to find the sweet spot between computational cost and performance.
The ESRGAN pipeline did a decent job of increasing performance in some categories, improving the overall mAP score roughly 2.5-fold compared to the basic model. However, given that this pipeline was twice as slow as the ABPN model while delivering only about 1.3 times its mAP, it may be less attractive for real-time applications. One positive note: ESRGAN's peak memory was on average the lowest of all our models, which raises the question of whether SR models could actually reduce resource usage in systems where every FLOP counts. Even though this pipeline was much faster and far less memory-hungry than HAT, its performance (when not fine-tuned) was subpar in comparison.
The ABPN pipeline was the fastest of the three SR models, taking on average a bit less than a second longer than the basic model to process the 20 evaluation images. Its performance did not match the HAT or ESRGAN models, but it was nearly twice as good as the basic model. So even though it did not perform amazingly, quantized models like ABPN deserve a closer look, especially if fine-tuned to our domain.
Another insight from the data is that recall is generally low across the board, meaning the pipelines miss most of the annotated objects. This makes sense, since we are using models trained on different datasets, with different annotation quality and detail. The fact that we were able to improve precision in some categories, however, shows real promise for this kind of set-up.
We should also note that the results found here are only the first step in a model selection process. There is a chance that low-performing models like ESRGAN, or even the Benthic Object Detector itself, could improve with fine-tuning on our TrashCAN dataset. Finally, a more thorough evaluation of the models would require a larger evaluation dataset.
Conclusion¶
We saw that all of our untuned SR models lifted the Benthic Object Detector's performance above what the model achieved on its own. The HAT model performed best, yet was also the slowest and most memory intensive. Of our two full-sized SR models, ESRGAN gave the worse performance on our evaluation metrics, but was also the most memory efficient, relying on many residual connections rather than large matrix multiplications. The ABPN model was the fastest of the three SR models; it did not reach the performance of ESRGAN or HAT, but still nearly doubled the mAP of the basic model.
Future work¶
This baseline study serves as a solid starting point for future research, where we can look into fine-tuning the models to our specific dataset. Some inspirations and ideas for future work that came up while developing this notebook:
- Fine-tuning
    - add an extra final output layer to the MBARI model, mapping its 691 outputs to the 17 TrashCAN labels (see the sketch after this list)
    - fine-tune the model on the TrashCAN dataset and evaluate the results
    - select images from FathomNet that have annotations matching the TrashCAN labels
    - fine-tune the model on those FathomNet images and evaluate the results
- Deeper comparative analysis
    - compare the performance of the super-resolution models on the FathomNet dataset
    - manually inspect annotations from TrashCAN and FathomNet to empirically evaluate their quality
    - compare on a larger portion of the TrashCAN dataset
- More research
    - Is there a lightweight transformer SR model that can compete with ABPN?
    - Can we actually speed up overall inference using an SR model?
Comments on implementation¶
We stripped all our implementations down to the bare minimum, for readability and ease of understanding. To do so, we rewrote some of the code included in the original implementations of the SR models. This gave us the flexibility to make adjustments where we saw fit, and helped us understand some of the inner workings of the models. If we were to scale this workflow up to consume much more data, a few important things should change:
- When upsampling the images, it would be a good idea to save the outputs to disk, to avoid holding too much in memory at once and to allow for async/batched inference. We could store and overwrite SR outputs from a batch in a temporary folder, then tear it down when training/evaluation is done (see the sketch after this list).
- When possible, we should try to reuse code from the original implementations. This would let us lean on the original models' documentation and community support, and potentially contribute back to the original projects if we find any bugs or improvements.
- We could also look into a more efficient way to feed images through the models, such as using a `torch.utils.data.Dataset` and `torch.utils.data.DataLoader` to load the images in batches (also sketched below). This would allow us to use the hardware more efficiently, and again enables async/batched inference.
- Enabling the use of a GPU would also greatly speed up the inference time of the models.
- Our final evaluation was only run on 20 images per category. This small sample size still gives us an idea of how the models will perform on the full dataset, but evaluating on a larger portion of the data should be done on faster hardware, to keep runtimes manageable.
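As a concrete example of the first and third points above (a sketch only, with hypothetical paths and helper names; `sr_model` is assumed to return a PIL image), SR outputs could be cached to a temporary folder and then served back in batches through a standard PyTorch dataset:

```python
import tempfile
from pathlib import Path

import torch
from PIL import Image
from torch.utils.data import DataLoader, Dataset
from torchvision.transforms.functional import to_tensor

class UpscaledImageDataset(Dataset):
    """Serves SR outputs previously written to a (temporary) cache folder."""

    def __init__(self, cache_dir: Path):
        self.paths = sorted(cache_dir.glob("*.png"))

    def __len__(self) -> int:
        return len(self.paths)

    def __getitem__(self, idx: int) -> torch.Tensor:
        # Assumes all SR outputs share one resolution so they stack into batches.
        return to_tensor(Image.open(self.paths[idx]).convert("RGB"))

# Hypothetical usage: upscale once, cache to disk, then batch through the detector.
cache_dir = Path(tempfile.mkdtemp())
# for i, image in enumerate(images):
#     sr_model(image).save(cache_dir / f"{i:05d}.png")
# loader = DataLoader(UpscaledImageDataset(cache_dir), batch_size=4, num_workers=2)
# for batch in loader:
#     detections = benthic_model(batch)
```

Writing the SR outputs once and deleting the cache afterwards keeps peak memory flat regardless of dataset size, at the cost of some disk I/O.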
Up next: Multi-object tracking¶
In the next blog post, we will look into multi-object tracking, where we will track the objects detected by the Benthic Object Detector over time. There, we will give a brief introduction to the problem, along with some of the fundamental concepts and methods used in the field. We will also explore some state-of-the-art trackers and implement a few of them.