ZooScan image segmentation using a UNet with a pretrained backbone¶

In [ ]:
%load_ext autoreload
%autoreload 2

In this lab, we would like to train a deep neural network to perform semantic segmentation of ZooScan images. This labwork will guide you through:

  • how to load the labeled ZooScan images
  • how to implement a UNet for semantic segmentation
  • how to train the network

Introduction¶

We are provided with labeled ZooScan data, which means we have both the ZooScan image and a mask. The mask is an image of labels. The data are located within the data subdirectory; every scan is around $20000\times 15000$ pixels.

In [ ]:
!ls data/train
rg20210310_mask.png  rg20210407_mask.png  rg20211103_mask.png  taxa.csv
rg20210310_scan.png  rg20210407_scan.png  rg20211103_scan.png
In [ ]:
!for f in data/train/*_scan.png; do file $f; done
data/train/rg20210310_scan.png: PNG image data, 22737 x 14503, 8-bit grayscale, non-interlaced
data/train/rg20210407_scan.png: PNG image data, 22707 x 14373, 8-bit grayscale, non-interlaced
data/train/rg20211103_scan.png: PNG image data, 22747 x 14573, 8-bit grayscale, non-interlaced

An example ZooScan image and its mask are displayed below

Zooscan image and mask example

The color code of the mask depends on the class to which each pixel has been assigned by the human labeler. Note that pixel-labeling these huge images is certainly tedious work, but the quality of your data and labels is of the utmost importance for our deep learning algorithms to work. The semantics of the class indices are provided in the taxa.csv file.

In [ ]:
!cat data/train/taxa.csv
label,living,label_nb
artefact,False,1
badfocus<artefact,False,2
bubble,False,3
detritus,False,4
fiber<detritus,False,5
t001,False,6
t003,False,7
Acartiidae,True,8
Actinopterygii,True,9
Aglaura,True,10
Annelida,True,11
Aulacantha,True,12
Calanidae,True,13
Calanoida,True,14
Candaciidae,True,15
Cavolinia inflexa,True,16
Centropagidae,True,17
Chaetognatha,True,18
Chelophyes appendiculata,True,19
Collodaria,True,20
Corycaeidae,True,21
Creseidae,True,22
Creseis acicula,True,23
Doliolida,True,24
Euchaetidae,True,25
Eumalacostraca,True,26
Evadne,True,27
Flaccisagitta enflata,True,28
Fritillariidae,True,29
Gammaridea,True,30
Globigerinidae,True,31
Gymnosomata,True,32
Harpacticoida,True,33
Heterorhabdidae,True,34
Hydrozoa,True,35
Hyperiidea,True,36
Insecta,True,37
Limacinidae,True,38
Metridinidae,True,39
Neoceratium,True,40
Oikopleuridae,True,41
Oithonidae,True,42
Oncaeidae,True,43
Orbulina,True,44
Ostracoda,True,45
Penilia avirostris,True,46
Podon,True,47
Rhizaria,True,48
Rhopalonema velatum,True,49
Salpida,True,50
Sapphirinidae,True,51
Temoridae,True,52
bract<Abylopsis tetragona,True,53
bract<Diphyidae,True,54
calyptopsis<Euphausiacea,True,55
colony<Phaeodaria,True,56
damaged<Aulacantha,True,57
egg<Actinopterygii,True,58
egg<Mollusca,True,59
egg<other,True,60
endostyle<Salpidae,True,61
eudoxie<Diphyidae,True,62
gonophore<Abylopsis tetragona,True,63
gonophore<Diphyidae,True,64
head<Chaetognatha,True,65
juvenile<Salpida,True,66
larvae<Porcellanidae,True,67
like<Collodaria,True,68
multiple<other,True,69
nectophore<Diphyidae,True,70
nectophore<Physonectae,True,71
nucleus<Salpidae,True,72
othertocheck,True,73
part<Cnidaria,True,74
part<Crustacea,True,75
part<Mollusca,True,76
part<Siphonophorae,True,77
part<Thaliacea,True,78
pluteus<Echinoidea,True,79
pluteus<Ophiuroidea,True,80
protozoea<Mysida,True,81
seaweed,True,82
siphonula,True,83
tail<Appendicularia,True,84
tail<Chaetognatha,True,85
trunk<Appendicularia,True,86
zoea<Brachyura,True,87
zoea<Galatheidae,True,88

We have $88$ classes of objects plus the background (label $0$). All the living organisms have been assigned a label strictly higher than $7$. The "living" column is therefore equivalent to testing whether label_nb is strictly larger than $7$.
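
As a quick sanity check, this equivalence can be verified directly from the csv file with nothing more than the standard library (a minimal sketch; the file path is the one listed above):

import csv

with open("data/train/taxa.csv") as f:
    rows = list(csv.DictReader(f))

# The "living" column should be equivalent to label_nb being strictly larger than 7
for row in rows:
    assert (row["living"] == "True") == (int(row["label_nb"]) > 7)
print(f"Checked {len(rows)} classes")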

The classes are unbalanced. For example, counting the number of occurrences of all the $89$ classes (background + $88$ non-living and living classes), we obtain the counts below, in decreasing order of occurrence.

The most represented class is the background with almost $900$ million pixels. The most represented non-background class is Salpida (class label $50$) with $60$ million pixels and the least represented class is Neoceratium with only $2$K pixels. This strong imbalance can cause a lot of trouble when training a neural network, as the over-represented classes are more easily learned than the under-represented ones.

Class name Count
background 903586894
Salpida 60370854
detritus 2242808
multiple<other 2142290
Calanoida 1914332
endostyle<Salpidae 1541269
badfocus<artefact 1336249
bubble 1302699
nucleus<Salpidae 1003932
Calanidae 835997
Chaetognatha 807700
juvenile<Salpida 701173
Euchaetidae 538480
part<Crustacea 485422
Centropagidae 468518
Candaciidae 462508
Corycaeidae 446955
fiber<detritus 366257
Eumalacostraca 333003
Rhopalonema velatum 324429
Metridinidae 313694
Gammaridea 310755
nectophore<Diphyidae 287985
Creseis acicula 285353
t001 260026
Flaccisagitta enflata 259964
othertocheck 259208
Chelophyes appendiculata 252368
Oikopleuridae 250231
Heterorhabdidae 227147
gonophore<Diphyidae 211023
part<Cnidaria 204616
nectophore<Physonectae 200246
Ostracoda 195320
Temoridae 180239
Oithonidae 158871
tail<Appendicularia 156565
Doliolida 156015
protozoea<Mysida 147630
bract<Diphyidae 114702
Acartiidae 112833
damaged<Aulacantha 109413
zoea<Galatheidae 107454
Cavolinia inflexa 101898
Hyperiidea 99523
calyptopsis<Euphausiacea 92612
Hydrozoa 88566
Aulacantha 72204
seaweed 70972
Sapphirinidae 69538
tail<Chaetognatha 69175
Gymnosomata 65518
egg<other 62427
Fritillariidae 62113
part<Mollusca 61776
Aglaura 53920
Annelida 53318
Creseidae 52541
like<Collodaria 52112
trunk<Appendicularia 50062
part<Siphonophorae 42509
eudoxie<Diphyidae 34491
Oncaeidae 29734
Limacinidae 28553
gonophore<Abylopsis tetragona 28054
egg<Actinopterygii 27244
zoea<Brachyura 25307
head<Chaetognatha 24456
bract<Abylopsis tetragona 23398
part<Thaliacea 23155
Insecta 22354
Actinopterygii 17853
colony<Phaeodaria 14070
artefact 13792
Penilia avirostris 13361
Harpacticoida 11465
t003 10630
pluteus<Ophiuroidea 10253
Collodaria 8803
larvae<Porcellanidae 8463
Podon 7855
egg<Mollusca 6938
pluteus<Echinoidea 5779
Globigerinidae 5704
Orbulina 5534
Evadne 5205
siphonula 3574
Rhizaria 2171
Neoceratium 2046
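
The counts in the table above can be obtained by accumulating a histogram of the mask labels over the three training masks; a minimal sketch, assuming the masks are single-channel label images with values in $0 \dots 88$:

import numpy as np
import matplotlib.pyplot as plt
from PIL import Image

# The scans are huge, so raise PIL's decompression-bomb limit
Image.MAX_IMAGE_PIXELS = 25000 * 15000

counts = np.zeros(89, dtype=np.int64)  # background + 88 classes
for mask_path in ["data/train/rg20210310_mask.png",
                  "data/train/rg20210407_mask.png",
                  "data/train/rg20211103_mask.png"]:
    mask = np.array(Image.open(mask_path))
    counts += np.bincount(mask.ravel(), minlength=89)

# Number of pixels per class, with a log-scaled y-axis as in the plot below
plt.bar(np.arange(89), counts)
plt.yscale("log")
plt.xlabel("Class label")
plt.ylabel("Number of pixels")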

The plot below shows the number of pixels per class. Note that the y-axis is in log scale. As we count pixels rather than objects, the imbalance could be explained by some organisms being larger than others or by their over-representation. In any case, this imbalance will cause you trouble when training a neural network.

Number of pixels per class

If we group the classes into non-living vs living, we obtain the following counts, where there are still more than $10$ times more non-living pixels than living ones.

Class name Count
Non living 909119355
Living 78495098

Imports¶

All the code you are going to write will go into the following files:

  • data.py : script responsible for handling the data pipeline, producing the dataloaders for the training and validation data
  • models/ : submodule responsible for providing the different models you want to experiment with
In [ ]:
# Standard imports
import pathlib

# External imports
import albumentations as A
import numpy as np
import matplotlib.pyplot as plt
import torch
import yaml

# Local imports
from planktoseg import data
from planktoseg import models
from planktoseg import optim
from planktoseg import utils
from planktoseg import metrics
from planktoseg import main

use_cuda = torch.cuda.is_available()
device = torch.device("cuda") if use_cuda else torch.device("cpu")

logdir = pathlib.Path("./logs")
if not logdir.exists():
    logdir.mkdir(exist_ok=True)
/usr/users/dce-admin/fix/GIT/2024_ml4oceans/venv/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html
  from .autonotebook import tqdm as notebook_tqdm

Data loading and exploration¶

In this part, we will be exploring the dataset :

  • load and visualize some samples
  • investigate the balance of the classes
  • investigate the application of some data augmentation techniques.

The very first step when training neural networks on your data is to prepare the data pipeline. The expected output of this first step is the data loaders, i.e. the python iterable objects able to give you minibatches for training and validation.

Dataset¶

In the data.py script, you are provided with the PlanktonDataset object. We wrote this class to ease your work of loading the data. This class can :

  • load the data (image and mask),
  • split every sample into patches; you can configure both the patch size and the patch stride (overlap = patch_size - patch_stride, see the short sketch after this list),
  • apply transformations on the input patches and mask patches
  • switch between two semantic segmentation tasks :
    1. classify a pixel as belonging to one of the $88$ classes (task = SegmentationTask.LIVING_CLASSES)
    2. classify a pixel as belonging to non living vs living classes (task = SegmentationTask.LIVING_NONLIVING)
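
To get a feel for the patching, here is a quick back-of-the-envelope sketch of the patch grid for one scan (it ignores any padding or border handling the class may actually implement):

patch_size, patch_stride = 512, 128
H, W = 14503, 22737  # rg20210310_scan.png (height, width)

n_h = (H - patch_size) // patch_stride + 1
n_w = (W - patch_size) // patch_stride + 1
print(f"{n_h} x {n_w} = {n_h * n_w} patches, each overlapping its neighbour by {patch_size - patch_stride} pixels")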

As an example, in the cell below, we instantiate this dataset object, which is going to:

  • split the large scans into patches of size $512 \times 512$ with a stride of $128 \times 128$
  • merge the labels into two classes: Non-living (label <= 7) and Living (label >= 8)
  • transform every patch and mask from an Image type to a pytorch Tensor
In [ ]:
transform = A.pytorch.ToTensorV2()

dataset = data.PlanktonDataset(root="./data/train", patch_size=(512, 512), patch_stride=(128, 128), task=data.SegmentationTask.LIVING_NONLIVING)
dataset = data.WrappedDataset(dataset, transform)
  0%|          | 0/3 [00:00<?, ?it/s]
100%|██████████| 3/3 [00:12<00:00,  4.07s/it]

We can now access both an image and its label by indexing the dataset. Feel free to repeat the execution of the cell below as it randomly samples the dataset for a new image/mask.

In [ ]:
idx = np.random.randint(len(dataset)) 

img, mask = dataset[idx]

print(f"The img is of type {type(img)} and of shape {img.shape}")
print(f"The mask is of type {type(mask)} and of shape {mask.shape}")

plt.subplot(1, 2, 1)
plt.imshow(img.squeeze(), cmap="gray")
plt.title("Zooscan image")
plt.axis("off")

plt.subplot(1, 2, 2)
plt.imshow(mask.squeeze(), interpolation="none", cmap="tab20c")
plt.title("Mask")
plt.axis("off")
The img is of type <class 'torch.Tensor'> and of shape torch.Size([1, 512, 512])
The mask is of type <class 'torch.Tensor'> and of shape torch.Size([512, 512])
Out[ ]:
(np.float64(-0.5), np.float64(511.5), np.float64(511.5), np.float64(-0.5))
Sampled Zooscan patch and its mask

Exploring the augmentation transforms¶

Data (of good quality) is of paramount importance but is usually limited in availability. We can virtually increase its availability by applying so-called "data augmentations", which are transforms of your inputs for which you know how to transform the target.

For this, we will use the albumentations python library which offers several transforms for various tasks (classification, object detection, semantic segmentation)

Exercise

Your first exercise is to identify, among the available data transforms (see for example this documentation, and do not forget to scroll down to the spatial-level transforms), which ones can be suitable. For example:

  • A.HorizontalFlip, which randomly flips your image/mask pair horizontally,
  • A.VerticalFlip, which randomly flips your image/mask pair vertically,
  • A.MaskDropout, which randomly masks some objects

You could also Blur or add GaussianNoise. I believe these transforms make sense for our plankton segmentation task, given the snow we see in the images and the possibly out-of-focus objects. If you wonder "Where should I stop adding transforms?" or "How do I know my transforms are ok?", remember that the purpose of these transforms is to augment your data, hopefully improving your validation metric.

In [ ]:
idx = np.random.randint(len(dataset)) 
idx = 50807

# Sample the dataset without all the transforms
# to see what the image and mask originally look like
original_transform = A.pytorch.ToTensorV2()
dataset.transform = original_transform
orig_img, orig_mask = dataset[idx]

##########################################################################################
# TODO: You have to fill this part !
# Tune the augmented transform by prepending your chosen transforms before the 
# conversion to pytorch tensor
# Feel free to evaluate the cell as you add transforms to see their effect
transform = A.Compose([
    A.HorizontalFlip(p=0.5),
    A.RandomRotate90(p=0.5),
    A.MaskDropout((1, 1), image_fill_value=255, p=1), 
    A.Blur(),
    A.pytorch.ToTensorV2()
])
##########################################################################################

# And now sample the exact same image/mask 
dataset.transform = transform
aug_img, aug_mask = dataset[idx]

plt.subplot(2, 2, 1)
plt.imshow(orig_img.squeeze(), cmap="gray", clim=(0, 255))
plt.title("Zooscan original")
plt.axis("off")

plt.subplot(2, 2, 2)
plt.imshow(orig_mask.squeeze(), interpolation="none", cmap="tab20c")
plt.title("Original Mask")
plt.axis("off")

plt.subplot(2, 2, 3)
plt.imshow(aug_img.squeeze(), cmap="gray", clim=(0, 255))
plt.title("Zooscan augmented image")
plt.axis("off")

plt.subplot(2, 2, 4)
plt.imshow(aug_mask.squeeze(), interpolation="none", cmap="tab20c")
plt.title("Augmented mask")
plt.axis("off")
Out[ ]:
(np.float64(-0.5), np.float64(511.5), np.float64(511.5), np.float64(-0.5))
Original and augmented image/mask pairs

Adding the transforms in the data pipeline¶

The suitable augmentation transforms you identified in the previous section need to be plugged into the data pipeline.

The most important function in the data.py script is the get_dataloaders function, which:

  • splits the dataset into training and validation folds,
  • gives each fold its own transforms (with augmentations for training, without augmentation for validation),
  • creates the dataloaders providing the mini-batches.
Exercise

In the get_dataloaders function of the data.py script, fill in the empty augmentation_transformations list with the suitable transforms you previously identified.
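
For example, the list could look like the following (this is only an illustration; keep the transforms you validated visually in the previous exercise):

augmentation_transformations = [
    A.HorizontalFlip(p=0.5),
    A.VerticalFlip(p=0.5),
    A.RandomRotate90(p=0.5),
]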

Once this is done, you can execute the following cell to obtain your dataloaders.

In [ ]:
# The configuration below requires 22GB of VRAM
data_config = {"trainpath": "./data/train", 
               "valid_ratio": 0.2,
               "batch_size": 32,
               "num_workers": 7,
               "patch_size": (256, 256),
               "patch_stride": (128, 128),
               "task": "living_nonliving",
               "normalize": True}

train_loader, valid_loader, input_size, num_classes, normalizing_stats = data.get_dataloaders(data_config, use_cuda)

# The normalizing statistics must be saved because they will be needed for inference
with open(logdir / "normalizing_stats.yaml", "w") as file:
    yaml.dump(normalizing_stats, file)
  0%|          | 0/3 [00:00<?, ?it/s]
100%|██████████| 3/3 [00:12<00:00,  4.06s/it]
100%|██████████| 1474/1474 [00:49<00:00, 29.98it/s]
In [ ]:
print(f"The train dataloaders contains {len(train_loader)} mini batches")
print(f"The valid dataloader contains {len(valid_loader)} mini batches")
print(f"Our problem contains {num_classes} classes and our inputs have the shape {input_size}")
print(f"For normalizing the input, we will be using the following statistics {normalizing_stats}")
The train dataloaders contains 1474 mini batches
The valid dataloader contains 369 mini batches
Our problem contains 2 classes and our inputs have the shape (1, 256, 256)
For normalizing the input, we will be using the following statistics {'mean': 0.8201782290938752, 'std': 0.09110527465244618}

Encoder/Decoder with a pretrained backbone¶

Since we now have the data to train on, the next step is to implement the model. We are going to implement a U-Net, as seen during the lecture, with a pre-trained backbone.

UNet architecture

In our codebase, it is the responsibility of the models module to build the models. This module provides you with a model builder, the models.build_model function. The UNet model is defined in the models/unet.py script as the UNet class. If you look at the code of that class, you will notice it is built from two components: the encoder, which is a TimmEncoder, and the decoder, of type Decoder.
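
Schematically, the UNet class only glues these two components together; a simplified sketch of the idea (the actual class in models/unet.py may differ in its constructor arguments and details):

import torch
from planktoseg.models.unet import TimmEncoder, Decoder

class UNetSketch(torch.nn.Module):
    def __init__(self, cin, num_classes):
        super().__init__()
        self.encoder = TimmEncoder(cin=cin, model_name="resnet18")
        self.decoder = Decoder(num_classes=num_classes)

    def forward(self, x):
        # The encoder returns the deepest features and the intermediate ones
        f4, [f1, f2, f3] = self.encoder(x)
        # The decoder upscales f4, merging f3, f2, f1 along the way
        return self.decoder(f4, [f1, f2, f3])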

Experimenting with the encoder¶

The code for the encoder is already given to you. This code will load a pretrained model provided by the timm library.

Exercise

To better appreciate what the encoder produces as output, your exercise is to:

  • create an encoder with cin=1 (grayscale input images) and model_name=resnet18
  • perform a forward pass through the network and check the dimensionality of the outputs.

As we are only interested in checking the dimensionalities of the output of the encoder, you can use a dummy torch.zeros tensor to perform the forward propagation.

In [ ]:
from planktoseg.models.unet import TimmEncoder

encoder = TimmEncoder(cin=1, model_name="resnet18")
fake_input = torch.zeros(1, 1, 512, 512)
f4, [f1, f2, f3] = encoder(fake_input)

print(f"With an input of shape {fake_input.shape}, \n our model outputs tensors of shape :")
print(f" - f1 : {f1.shape}")
print(f" - f2 : {f2.shape}")
print(f" - f3 : {f3.shape}")
print(f" - f4 : {f4.shape}")
With an input of shape torch.Size([1, 1, 512, 512]), 
 our model outputs tensors of shape :
 - f1 : torch.Size([1, 64, 128, 128])
 - f2 : torch.Size([1, 128, 64, 64])
 - f3 : torch.Size([1, 256, 32, 32])
 - f4 : torch.Size([1, 512, 16, 16])

Implementing the decoder¶

We now move on to the decoder part. The decoder receives the outputs of the encoder and progressively upscales the representation to finally obtain an output whose spatial dimensions match those of the input. With an input of shape $(B, C, H, W)$, the output of the final layer is expected to be of shape $(B, K, H, W)$ where $K$ is the number of classes you want to predict for every pixel.

The specificity of the UNet is that along the upscaling path, you integrate features from intermediate layers of the encoder through the so-called shortcut connections, the connections that provide the $f_3, f_2, f_1$ features depicted on the figure above.

Exercise

Your exercise is to finish the code for the decoder in the models/unet.py script. Like the encoder, the decoder is built from repeated blocks, called DecoderBlock in the code. The Decoder class itself is already coded but you must finish the code of the DecoderBlock. You have to complete the code both in the constructor and for the forward pass.

A Decoder block receives, along the upscaling path, an input tensor with cin channels and is built from a sequence of layers :

  • conv1 which is a Sequential block with 2D convolution, Batch normalization layer and ReLU. This sub-block should output cin channels,
  • up_conv which is a Sequential block with an upscaling layer followed by a 2D convolution, Batch normalization and ReLU. This sub-block should output cin//2 channels
  • conv2 which is a sequential block with a 2D convolution, Batch normalization layer and ReLU. This sub-block takes as input cin channels and outputs cin//2 channels.

For the forward pass, your decoder block receives two inputs: x and f_encoder. The tensor x holds the features flowing through the upscaling path, while f_encoder holds the features received from the encoder through the shortcut connections. During the forward pass you need to:

  • pass the x features through conv1 and up_conv,
  • concatenate the output of the previous step with the encoder features f_encoder,
  • pass the output of the previous step through the final sub-block conv2

Note how the dimensions change during these steps. At the output of up_conv, your tensor will have cin//2 channels. The f_encoder contains cin//2 channels as well. When both are concatenated, your tensor has cin channels and the final conv2 transforms these into cin//2 channels.
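
If you get stuck, the block described above could be implemented along the following lines (one possible sketch; the expected code in models/unet.py may differ, e.g. in the kernel sizes or in the choice of the upsampling layer):

import torch
import torch.nn as nn

class DecoderBlockSketch(nn.Module):
    def __init__(self, cin):
        super().__init__()
        # conv1 keeps cin channels
        self.conv1 = nn.Sequential(
            nn.Conv2d(cin, cin, kernel_size=3, padding=1),
            nn.BatchNorm2d(cin),
            nn.ReLU(inplace=True),
        )
        # up_conv doubles the spatial resolution and halves the number of channels
        self.up_conv = nn.Sequential(
            nn.Upsample(scale_factor=2, mode="bilinear", align_corners=False),
            nn.Conv2d(cin, cin // 2, kernel_size=3, padding=1),
            nn.BatchNorm2d(cin // 2),
            nn.ReLU(inplace=True),
        )
        # conv2 maps the cin channels obtained after concatenation to cin // 2
        self.conv2 = nn.Sequential(
            nn.Conv2d(cin, cin // 2, kernel_size=3, padding=1),
            nn.BatchNorm2d(cin // 2),
            nn.ReLU(inplace=True),
        )

    def forward(self, x, f_encoder):
        x = self.up_conv(self.conv1(x))
        # Concatenate with the shortcut features along the channel dimension
        x = torch.cat([x, f_encoder], dim=1)
        return self.conv2(x)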

To test your implementation, you can run the following cell which should complete without errors.

In [ ]:
from planktoseg.models.unet import DecoderBlock, Decoder

# First test : we check the forward pass through a decoder block is working
dummy_input = torch.zeros(3, 4, 128, 128)
dummy_encoder_features = torch.zeros(3, 2, 256, 256)
block = DecoderBlock(4)
output = block(dummy_input, dummy_encoder_features)

print(f"With an input of shape {dummy_input.shape} with encoder features of shape {dummy_encoder_features.shape}, the output of the decoder block is of shape {output.shape}")

assert list(output.shape) == [3, 2, 256, 256]

# Second test : we check the forward pass through a complete decoder is working
batch_size = 3
K = 10
f1 = torch.zeros(batch_size, 64, 128, 128)
f2 = torch.zeros(batch_size, 128, 64, 64)
f3 = torch.zeros(batch_size, 256, 32, 32)
f4 = torch.zeros(batch_size, 512, 16, 16)

decoder = Decoder(num_classes = K)
output = decoder(f4, [f1, f2, f3])

print(f"The output of the decoder is of shape {output.shape}")

assert list(output.shape) == [batch_size, K, 512, 512]
With an input of shape torch.Size([3, 4, 128, 128]) with encoder features of shape torch.Size([3, 2, 256, 256]), the output of the decoder block is of shape torch.Size([3, 2, 256, 256])
The output of the decoder is of shape torch.Size([3, 10, 512, 512])

Building the complete model¶

Once the encoder and decoder are implemented, we can create the complete model and send it to the device used for the experiments.

In [ ]:
%%capture

model = models.UNet({"encoder": {"model_name": "resnet18"}}, input_size, 1 if num_classes == 2 else num_classes)
model = model.to(device)

Loss function and metrics for an unbalanced classification¶

Our problem is a classification problem, although a pixel-wise one: you need to classify every single pixel of an image. A natural first-guess loss function in this case is the cross entropy loss, which reads:

$$ CE(\{x_i, y_i\}) = \frac{1}{N\times H \times W} \sum_{i=0}^{N-1}\sum_{h=0}^{H-1}\sum_{w=0}^{W-1} -\log(p(y_{i,h,w} | x_i)) = \frac{1}{N\times H \times W} \sum_{i=0}^{N-1}\sum_{h=0}^{H-1}\sum_{w=0}^{W-1} -\log(f_w(x_i)_{h,w,y_{i,h,w}}) $$

where we denote by $f_w(x_i)$ the probability distributions your model assigns to the $H \times W$ pixels of your image, so that $f_w(x_i)_{h, w, y_{i,h,w}}$ is the probability assigned by your model, at pixel $(h, w)$, to the target class $y_{i,h,w}$. This loss gives an over-influence to the majority class in an unbalanced dataset. Other losses may be preferred, such as the focal loss, dice loss, weighted cross entropy loss, ...

In this lab, you are provided with an implementation of the focal loss. The focal loss strongly decreases the influence of the pixels that are already correctly predicted and, usually, these correspond to pixels belonging to the over-represented classes. It reads:

$$ FL(\{x_i, y_i\}) = \frac{1}{N\times H \times W} \sum_{i=0}^{N-1}\sum_{h=0}^{H-1}\sum_{w=0}^{W-1} -(1-p(y_{i,h,w} | x_i))^\gamma \log(p(y_{i,h,w} | x_i)) = \frac{1}{N\times H \times W} \sum_{i=0}^{N-1}\sum_{h=0}^{H-1}\sum_{w=0}^{W-1} -(1 - f_w(x_i)_{h,w,y_{i,h,w}})^\gamma \log(f_w(x_i)_{h,w,y_{i,h,w}}) $$

with, for example, $\gamma=2$. To illustrate the difference between the cross entropy loss and the focal loss, we display below the two losses as a function of $p(y_{i,h,w} | x_i)$. As you can see, as the probability assigned by your model tends to $1$, its contribution to the loss is lowered with respect to the BCE loss.
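
You are provided with optim.FocalLoss, so there is nothing to implement here; for reference only, a binary focal loss on logits could be sketched as follows (an illustration, not necessarily identical to the provided implementation):

import torch
import torch.nn as nn
import torch.nn.functional as F

class BinaryFocalLossSketch(nn.Module):
    def __init__(self, gamma=2.0):
        super().__init__()
        self.gamma = gamma

    def forward(self, logits, targets):
        # logits: (B, 1, H, W), targets: (B, H, W) with values in {0, 1}
        targets = targets.float().unsqueeze(1)
        # Probability assigned to the target class of every pixel
        p = torch.sigmoid(logits)
        p_t = p * targets + (1 - p) * (1 - targets)
        # Per-pixel cross entropy, down-weighted by (1 - p_t) ** gamma
        bce = F.binary_cross_entropy_with_logits(logits, targets, reduction="none")
        return ((1 - p_t) ** self.gamma * bce).mean()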

In [ ]:
import matplotlib.pyplot as plt
import torch
import torch.nn as nn
import torch.nn.functional as F

gamma = 2
Nsteps = 50
p = torch.linspace(0., 1., steps=Nsteps)
labels = torch.ones_like(p)

bce_loss_values = -torch.log(p)
focal_loss_values = -(1-p)**gamma * torch.log(p)

plt.figure()
plt.plot(p, bce_loss_values, label='BCE loss')
plt.plot(p, focal_loss_values, label='Focal loss')
plt.xlabel("Probability assigned to the class to be predicted")
plt.ylabel("Loss value")
plt.legend()
Out[ ]:
<matplotlib.legend.Legend at 0x7f1ce8d17430>
BCE loss and focal loss as a function of the assigned probability
Exercise

Evaluate the following cell to define the loss as the Focal loss

In [ ]:
loss = optim.FocalLoss()

Last elements : optimizer, model checkpointing, metrics, loggers, ...¶

The final elements we need are the optimizer, the model checkpoint callback that saves the best model, some metrics computations and possibly loggers.

To define all these, you just need to evaluate the following cell.

In [ ]:
# Optimizer
optimizer = torch.optim.Adam(model.parameters(), lr=0.001)

# Metrics evaluated over the training and validation folds
train_fmetrics = {
    "focal": main.deepcs.metrics.GenericBatchMetric(loss),
    "accuracy": main.BatchAccuracy(),
    "confusion_matrix": metrics.BinaryConfusionMatrixMetric(),
}
train_fmetrics["F1"] = metrics.BinaryF1Metric()
test_fmetrics = {
    "focal": main.deepcs.metrics.GenericBatchMetric(loss),
    "accuracy": main.BatchAccuracy(),
    "confusion_matrix": metrics.BinaryConfusionMatrixMetric(),
}
test_fmetrics["F1"] = metrics.BinaryF1Metric()

# Define the model checkpoint callback, which saves the best model
model_checkpoint = utils.ModelCheckpoint(
    model, logdir, (1,) + input_size, device, min_is_best=False
)

Our first experiments¶

All right, we now have all the building blocks for running our first training. Depending on your settings and GPU, it may be more or less fast :)

On an RTX 3090, with a batch size of $16$ and images of size $512 \times 512$, processing $3000$ minibatches takes almost 20 minutes per epoch and 22GB of VRAM.

Also, while preparing the labwork, I observed that the batch size should not be too small. Using a batch size of $7$ led to convergence to a bad-quality local minimum, while a batch size of $16$ allowed the focal loss to be minimized further. Unfortunately, this implies a lower bound on the GPU memory required.

In [ ]:
num_epochs = 2

metrics_store = {"train": [], "valid": []}

def postprocess_metrics(fmetrics, metrics_dict):
    """
    This function is used only for extracting
    the precision and recall we track for displaying and plotting
    """
    cm = fmetrics["confusion_matrix"]
    metrics_dict["precision"] = cm.get_precision()
    metrics_dict["recall"] = cm.get_recall()

# Evaluate the metrics before training
train_metrics = utils.test(model, train_loader, device, train_fmetrics)
postprocess_metrics(train_fmetrics, train_metrics)
metrics_store["train"].append(train_metrics)

valid_metrics = utils.test(model, valid_loader, device, test_fmetrics)
postprocess_metrics(test_fmetrics, valid_metrics)
metrics_store["valid"].append(valid_metrics)

for e in range(num_epochs):
        # Train 1 epoch
        train_metrics = utils.train(
            model, train_loader, loss, optimizer, device, train_fmetrics
        )
        postprocess_metrics(train_fmetrics, train_metrics)
        metrics_store["train"].append(train_metrics)

        # Test
        valid_metrics = utils.test(model, valid_loader, device, test_fmetrics)
        postprocess_metrics(test_fmetrics, valid_metrics)
        metrics_store["valid"].append(valid_metrics)

        # Save the model if it is better
        checkpoint_metric_name = "F1"
        checkpoint_metric = valid_metrics[checkpoint_metric_name]
        updated = model_checkpoint.update(checkpoint_metric)

        # Display the metrics
        metrics_msg = f" Epoch {e} / {num_epochs}\n"
        metrics_msg += "- Train : \n  "
        metrics_msg += "\n  ".join(
            f" {m_name}: {m_value}" for (m_name, m_value) in train_metrics.items()
        )
        metrics_msg += "\n"
        metrics_msg += "- Valid : \n  "
        metrics_msg += "\n  ".join(
            f" {m_name}: {m_value}"
            + ("[>> BETTER <<]" if updated and m_name == checkpoint_metric_name else "")
            for (m_name, m_value) in valid_metrics.items()
        )
        print(metrics_msg)
        
    
  0%|          | 0/1474 [00:00<?, ?it/s]
100%|██████████| 1474/1474 [01:21<00:00, 18.17it/s]
100%|██████████| 369/369 [00:20<00:00, 18.01it/s]
100%|██████████| 1474/1474 [04:38<00:00,  5.29it/s]
100%|██████████| 369/369 [00:20<00:00, 17.83it/s]
 Epoch 0 / 2
- Train : 
   focal: 0.05041743235933004
   accuracy: 0.9605594004834199
   confusion_matrix: [[0.9954146118281357, 0.004585388171864319], [0.5870692592258612, 0.41293074077413877]]
   F1: 0.5416884766447951
   precision: 0.7871255188568016
   recall: 0.41293074077413877
- Valid : 
   focal: 0.03458496961828569
   accuracy: 0.8642685112506758
   confusion_matrix: [[0.9850354573537219, 0.014964542646278133], [0.526730909307094, 0.473269090692906]]
   F1: 0.6034457223144885[>> BETTER <<]
   precision: 0.8324059615164311
   recall: 0.473269090692906
100%|██████████| 1474/1474 [04:33<00:00,  5.39it/s]
100%|██████████| 369/369 [00:20<00:00, 17.89it/s]
 Epoch 1 / 2
- Train : 
   focal: 0.01360388492515849
   accuracy: 0.960526061672692
   confusion_matrix: [[0.9962440705799295, 0.00375592942007056], [0.5190544495534446, 0.4809455504465554]]
   F1: 0.6117580025823954
   precision: 0.8403155563173192
   recall: 0.4809455504465554
- Valid : 
   focal: 0.017102164999813124
   accuracy: 0.8642685112506758
   confusion_matrix: [[0.9906546216510921, 0.009345378348907864], [0.48852997030393647, 0.5114700296960635]]
   F1: 0.6511491356972307[>> BETTER <<]
   precision: 0.8957810601232823
   recall: 0.5114700296960635

During training, we recorded metrics into the metrics_store dictionary and we can now display them. This is a very basic way to plot these metrics; at the very end of the lab, we propose wandb.ai, which is far more convenient.

In [ ]:
import matplotlib.pyplot as plt

plt.figure(figsize=(15,5), dpi=150)
plt.subplot(1, 4, 1)
plt.plot([mi["focal"] for mi in metrics_store["train"]], 'k-')
plt.plot([mi["focal"] for mi in metrics_store["valid"]], 'k--')
plt.title("Focal loss")
plt.xlabel("Epoch")

plt.subplot(1, 4, 2)
plt.plot([mi["F1"] for mi in metrics_store["train"]], 'k-')
plt.plot([mi["F1"] for mi in metrics_store["valid"]], 'k--')
plt.title("F1 score")
plt.xlabel("Epoch")

plt.subplot(1, 4, 3)
plt.plot([mi["precision"] for mi in metrics_store["train"]], 'k-')
plt.plot([mi["precision"] for mi in metrics_store["valid"]], 'k--')
plt.title("Precision")
plt.xlabel("Epoch")

plt.subplot(1, 4, 4)
plt.plot([mi["recall"] for mi in metrics_store["train"]], 'k-')
plt.plot([mi["recall"] for mi in metrics_store["valid"]], 'k--')
plt.title("Recall")
plt.xlabel("Epoch")
Out[ ]:
Text(0.5, 0, 'Epoch')
Focal loss, F1 score, precision and recall over the epochs

Inference on new zooscan images¶

Now that we have trained our first UNet, we would like to apply it to new data, to perform so-called "inference". In the training loop above, the model that we consider the best is the one maximizing the F1 score on the validation data. This best model has been saved during the optimization as an ONNX file. There are actually several ways to save a model, for example as either a torch tensor of parameters or an ONNX graph, and the ONNX export is certainly the more portable of the two.

ONNX graphs can be executed with ONNX runtimes available in many different languages.

The cell below is a standalone cell. It can be executed without the other cells being executed. This is really the complete inference code.

Also, the patch size for inference is arbitrary. Indeed, as a UNet is a fully convolutional model, it can be trained on patches of shape, say, $512 \times 512$, and then seamlessly be evaluated on patches of arbitrary size, for example $4096 \times 4096$. To test inference, my advice would be to start with a small patch size and then increase it; you may fill your memory if the patch size is too large. To perform inference on a large image, a naive approach is to split it into smaller non-overlapping patches, perform inference on each and then stitch the results together.
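
A minimal sketch of this naive tiling strategy is given below; it reuses the ONNX session and the "scan" input name from the cell that follows and, to keep things simple, ignores the right and bottom borders that do not fit a full patch:

import numpy as np

def predict_full_scan(session, scan, patch_size=2048):
    """Naive tiled inference. scan is the full, already normalized, (H, W) float32 image."""
    H, W = scan.shape
    pred = np.zeros((H, W), dtype=bool)
    for i in range(0, H - patch_size + 1, patch_size):
        for j in range(0, W - patch_size + 1, patch_size):
            patch = scan[np.newaxis, np.newaxis, i:i + patch_size, j:j + patch_size]
            logits = session.run(None, {"scan": patch})[0]
            # sigmoid(logit) >= 0.5 is equivalent to logit >= 0
            pred[i:i + patch_size, j:j + patch_size] = logits.squeeze() >= 0.0
    return pred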

To run the following cell, you may need to restart your kernel so that the memory gets freed on the GPU.

In [ ]:
import pathlib
import matplotlib.pyplot as plt
import onnxruntime as ort
from PIL import Image
Image.MAX_IMAGE_PIXELS = 25000 * 15000
import numpy as np
import yaml

providers = []
use_cuda = True
patch_size = 4096

if use_cuda:
    providers.append("CUDAExecutionProvider")
providers.append("CPUExecutionProvider")

# You may adapt the following to either use 
# the model you trained  or the pretrained model you are provided
# logdir = pathlib.Path("pretrained_model")
logdir = pathlib.Path("logs")

inference_session = ort.InferenceSession(
    str(logdir / "best_model.onnx"), providers=providers
)

# Load our normalizing statistics
stats = yaml.safe_load(open(str(logdir / "normalizing_stats.yaml"), "r"))
mean = stats["mean"]
std = stats["std"]

# Load our image
scan_path = "./data/test/rg20210421_scan.png"
scan_img = np.array(Image.open(scan_path))

mask_path = "./data/test/rg20210421_mask.png"
mask_img = np.array(Image.open(mask_path))
print(mask_img.shape)

crop_offset = (5048, 2048)
# Normalize our input
scan_img = ((scan_img - mean * 255.)/(std * 255.)).astype(np.float32)
scan_img = scan_img[np.newaxis, np.newaxis, ...]
scan_img = scan_img[:, :, crop_offset[0]:(crop_offset[0] + patch_size), crop_offset[1]:(crop_offset[1] + patch_size)]

# Get the ground truth mask
# print(np.unique(mask_img))
mask_img = mask_img[crop_offset[0]:(crop_offset[0] + patch_size), crop_offset[1]:(crop_offset[1] + patch_size)] >= 8

# Perform an inference
logits = inference_session.run(None, {"scan": scan_img})[0]
probs = 1.0 / (1.0 + np.exp(-logits))

pred_mask = probs >= 0.5

# Plot the results
plt.figure(dpi=300)
plt.subplot(1, 4, 1)
plt.imshow(scan_img.squeeze(), cmap="gray")
plt.title("Zooscan image")
plt.axis("off")

plt.subplot(1, 4, 2)
plt.imshow(probs.squeeze(), interpolation="none", clim=(0.0, 1.0))
plt.title("Probabilities")
plt.axis("off")

plt.subplot(1, 4, 3)
plt.imshow(pred_mask.squeeze(), interpolation="none", cmap="tab20c")
plt.title("Predicted Mask")
plt.axis("off")

plt.subplot(1, 4, 4)
plt.imshow(mask_img, interpolation="none", cmap="tab20c")
plt.title("Ground truth")
plt.axis("off")

plt.tight_layout()
(14573, 22817)
Zooscan crop, predicted probabilities, predicted mask and ground truth

Going further¶

Using DeepLab v3+ instead of the UNet with pretrained backbone¶

All right, you implemented and trained a custom U-Net with a pretrained backbone. What about experimenting with a more state-of-the-art model such as DeepLabV3+? For this, you can either use the segmentation models provided by torchvision or rely on an external library such as segmentation_models_pytorch.

In [ ]:
%pip install segmentation_models_pytorch
Collecting segmentation_models_pytorch
  Downloading segmentation_models_pytorch-0.3.4-py3-none-any.whl (109 kB)
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 109.5/109.5 KB 1.4 MB/s eta 0:00:00a 0:00:01
Collecting efficientnet-pytorch==0.7.1
  Downloading efficientnet_pytorch-0.7.1.tar.gz (21 kB)
  Preparing metadata (setup.py) ... done
Requirement already satisfied: huggingface-hub>=0.24.6 in ./venv/lib/python3.10/site-packages (from segmentation_models_pytorch) (0.25.1)
Collecting pretrainedmodels==0.7.4
  Downloading pretrainedmodels-0.7.4.tar.gz (58 kB)
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 58.8/58.8 KB 1.6 MB/s eta 0:00:00
  Preparing metadata (setup.py) ... done
Requirement already satisfied: six in ./venv/lib/python3.10/site-packages (from segmentation_models_pytorch) (1.16.0)
Collecting timm==0.9.7
  Downloading timm-0.9.7-py3-none-any.whl (2.2 MB)
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 2.2/2.2 MB 5.1 MB/s eta 0:00:00:00:0100:01
Requirement already satisfied: torchvision>=0.5.0 in ./venv/lib/python3.10/site-packages (from segmentation_models_pytorch) (0.19.1)
Requirement already satisfied: pillow in ./venv/lib/python3.10/site-packages (from segmentation_models_pytorch) (10.4.0)
Requirement already satisfied: tqdm in ./venv/lib/python3.10/site-packages (from segmentation_models_pytorch) (4.66.5)
Requirement already satisfied: torch in ./venv/lib/python3.10/site-packages (from efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (2.4.1)
Collecting munch
  Downloading munch-4.0.0-py2.py3-none-any.whl (9.9 kB)
Requirement already satisfied: safetensors in ./venv/lib/python3.10/site-packages (from timm==0.9.7->segmentation_models_pytorch) (0.4.5)
Requirement already satisfied: pyyaml in ./venv/lib/python3.10/site-packages (from timm==0.9.7->segmentation_models_pytorch) (6.0.2)
Requirement already satisfied: filelock in ./venv/lib/python3.10/site-packages (from huggingface-hub>=0.24.6->segmentation_models_pytorch) (3.16.1)
Requirement already satisfied: typing-extensions>=3.7.4.3 in ./venv/lib/python3.10/site-packages (from huggingface-hub>=0.24.6->segmentation_models_pytorch) (4.12.2)
Requirement already satisfied: packaging>=20.9 in ./venv/lib/python3.10/site-packages (from huggingface-hub>=0.24.6->segmentation_models_pytorch) (24.1)
Requirement already satisfied: fsspec>=2023.5.0 in ./venv/lib/python3.10/site-packages (from huggingface-hub>=0.24.6->segmentation_models_pytorch) (2024.9.0)
Requirement already satisfied: requests in ./venv/lib/python3.10/site-packages (from huggingface-hub>=0.24.6->segmentation_models_pytorch) (2.32.3)
Requirement already satisfied: numpy in ./venv/lib/python3.10/site-packages (from torchvision>=0.5.0->segmentation_models_pytorch) (2.1.1)
Requirement already satisfied: nvidia-cusparse-cu12==12.1.0.106 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (12.1.0.106)
Requirement already satisfied: nvidia-nvtx-cu12==12.1.105 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (12.1.105)
Requirement already satisfied: nvidia-curand-cu12==10.3.2.106 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (10.3.2.106)
Requirement already satisfied: nvidia-cuda-nvrtc-cu12==12.1.105 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (12.1.105)
Requirement already satisfied: jinja2 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (3.1.4)
Requirement already satisfied: triton==3.0.0 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (3.0.0)
Requirement already satisfied: sympy in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (1.13.3)
Requirement already satisfied: nvidia-cublas-cu12==12.1.3.1 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (12.1.3.1)
Requirement already satisfied: nvidia-nccl-cu12==2.20.5 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (2.20.5)
Requirement already satisfied: nvidia-cusolver-cu12==11.4.5.107 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (11.4.5.107)
Requirement already satisfied: networkx in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (3.3)
Requirement already satisfied: nvidia-cuda-cupti-cu12==12.1.105 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (12.1.105)
Requirement already satisfied: nvidia-cudnn-cu12==9.1.0.70 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (9.1.0.70)
Requirement already satisfied: nvidia-cuda-runtime-cu12==12.1.105 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (12.1.105)
Requirement already satisfied: nvidia-cufft-cu12==11.0.2.54 in ./venv/lib/python3.10/site-packages (from torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (11.0.2.54)
Requirement already satisfied: nvidia-nvjitlink-cu12 in ./venv/lib/python3.10/site-packages (from nvidia-cusolver-cu12==11.4.5.107->torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (12.6.77)
Requirement already satisfied: urllib3<3,>=1.21.1 in ./venv/lib/python3.10/site-packages (from requests->huggingface-hub>=0.24.6->segmentation_models_pytorch) (2.2.3)
Requirement already satisfied: certifi>=2017.4.17 in ./venv/lib/python3.10/site-packages (from requests->huggingface-hub>=0.24.6->segmentation_models_pytorch) (2024.8.30)
Requirement already satisfied: charset-normalizer<4,>=2 in ./venv/lib/python3.10/site-packages (from requests->huggingface-hub>=0.24.6->segmentation_models_pytorch) (3.3.2)
Requirement already satisfied: idna<4,>=2.5 in ./venv/lib/python3.10/site-packages (from requests->huggingface-hub>=0.24.6->segmentation_models_pytorch) (3.10)
Requirement already satisfied: MarkupSafe>=2.0 in ./venv/lib/python3.10/site-packages (from jinja2->torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (2.1.5)
Requirement already satisfied: mpmath<1.4,>=1.1.0 in ./venv/lib/python3.10/site-packages (from sympy->torch->efficientnet-pytorch==0.7.1->segmentation_models_pytorch) (1.3.0)
Using legacy 'setup.py install' for efficientnet-pytorch, since package 'wheel' is not installed.
Using legacy 'setup.py install' for pretrainedmodels, since package 'wheel' is not installed.
Installing collected packages: munch, efficientnet-pytorch, timm, pretrainedmodels, segmentation_models_pytorch
  Running setup.py install for efficientnet-pytorch ... done
  Attempting uninstall: timm
    Found existing installation: timm 1.0.9
    Uninstalling timm-1.0.9:
      Successfully uninstalled timm-1.0.9
  Running setup.py install for pretrainedmodels ... done
Successfully installed efficientnet-pytorch-0.7.1 munch-4.0.0 pretrainedmodels-0.7.4 segmentation_models_pytorch-0.3.4 timm-0.9.7
Note: you may need to restart the kernel to use updated packages.

For example, below is a snippet to construct DeepLabV3+ as proposed in Encoder-Decoder with Atrous Separable Convolution for Semantic Image Segmentation. You can now go back to your code and experiment with one of the models proposed by segmentation_models_pytorch.

In [ ]:
import torch
import segmentation_models_pytorch as smp

model = smp.DeepLabV3Plus(
    encoder_name="resnet18", 
    encoder_weights="imagenet", 
    in_channels=1, 
    classes=1, 
)

dummy_input = torch.zeros(3, 1, 512, 512)
output = model(dummy_input)
print(f"The output has a shape {output.shape}")
Downloading: "https://download.pytorch.org/models/resnet18-5c106cde.pth" to /usr/users/dce-admin/fix/.cache/torch/hub/checkpoints/resnet18-5c106cde.pth
100%|██████████| 44.7M/44.7M [00:04<00:00, 11.7MB/s]
The output has a shape torch.Size([3, 1, 512, 512])

Interfacing with an online dashboard : wandb.ai¶

As you may expect, deep learning is about tuning your whole pipeline, experimenting with different models, and so on, and you need to efficiently track all the experiments you will be running.

One part of the answer lies in using dashboards; online dashboards are especially useful. One such dashboard is wandb.ai. To monitor your experiments with wandb, you just need to add a few lines of code.

First, you need to get an account on wandb. This is free and academics have free plans. Once you have an account, you can create a new project, for which you will obtain both a project name and an entity name.

Then you can connect to your wandb account by calling

import wandb
wandb.init(project=..., entity=....)

and finally, to record your metrics during training, you simply need to call the following function after every epoch :

wandb.log({my_metric_name: my_metric_value})

In our case, we have two dictionaries, train_metrics and valid_metrics, which contain our metrics; we just need to call wandb.log on them to get the metrics logged:
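
For example, at the end of every epoch, something along the following lines would log the scalar metrics (the confusion matrices are skipped here because they are not scalars):

wandb.log(
    {**{f"train_{name}": value for name, value in train_metrics.items() if name != "confusion_matrix"},
     **{f"valid_{name}": value for name, value in valid_metrics.items() if name != "confusion_matrix"}}
)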

wandb dashboard example

Running the code without jupyter¶

Between you and me, a jupyter notebook is great for exploring concepts, but you definitely want to move away from it for large-scale experiments: running jupyter notebooks is not the most efficient way to perform multiple experiments.

Actually, I adapted a python library I wrote for plankton segmentation so that you are able to evaluate everything from within a notebook.

The library is available on github at https://github.com/jeremyfix/2024_ml4oceans. Feel free to make use of it. You are also provided with a python script submit_slurm.py which allows you to easily run experiments on clusters managed by SLURM (e.g. Jean Zay). Note you will certainly have to adapt the slurm sbatch directives to make it work (e.g. partition name, ...)

In [ ]: