Source code for towbintools.deep_learning.architectures.models

import pytorch_lightning as pl
import segmentation_models_pytorch as smp
import timm
import torch
import torch.nn as nn
from torchmetrics.classification import BinaryF1Score
from torchmetrics.classification import MulticlassF1Score

from .archs import AttentionUnet1D
from .archs import Unet1D
from .archs import UnetPlusPlus1D
from towbintools.deep_learning.utils.loss import FocalTverskyLoss
from towbintools.deep_learning.utils.loss import MultiClassFocalLoss
from towbintools.deep_learning.utils.loss import PeakWeightedMSELoss



[docs]
class ClassificationModel(pl.LightningModule):
    """
    PyTorch Lightning module for image classification using a pretrained backbone.

    Uses ``timm`` to load the specified architecture with ImageNet-pretrained weights.
    Applies ``BCEWithLogitsLoss`` + ``BinaryF1Score`` for binary tasks, or
    ``CrossEntropyLoss`` + ``MulticlassF1Score`` for multiclass tasks.

    Parameters:
        architecture (str): ``timm`` model name (e.g. ``"efficientnet_b0"``).
        input_channels (int): Number of input image channels.
        classes (list[str]): Class labels; ``len(classes)`` determines binary vs multiclass.
        learning_rate (float): Learning rate for the Adam optimizer.
        normalization (dict): Normalization config stored as a hyperparameter and
            used at inference time to reconstruct the preprocessing pipeline.
    """

    def __init__(
        self,
        architecture,
        input_channels,
        classes,
        learning_rate,
        normalization,
    ):
        super().__init__()
        n_classes = len(classes)
        if n_classes == 2:
            self.activation = nn.Sigmoid()
        else:
            self.activation = nn.Softmax(dim=1)

        model = timm.create_model(
            architecture,
            pretrained=True,
            num_classes=n_classes,
            in_chans=input_channels,
        )

        self.model = model
        self.learning_rate = learning_rate
        self.classes = classes
        self.n_classes = n_classes
        if n_classes == 2:
            self.criterion = nn.BCEWithLogitsLoss()
            self.f1_score = BinaryF1Score()
        else:
            self.criterion = nn.CrossEntropyLoss()
            self.f1_score = MulticlassF1Score(num_classes=n_classes)

        self.normalization = normalization
        self.save_hyperparameters()


[docs]
    def forward(self, x):
        y = self.model(x)
        return self.activation(y)



[docs]
    def log_tb_images(self, viz_batch) -> None:
        # Get tensorboard logger
        tb_logger = None
        for logger in self.trainer.loggers:
            if isinstance(logger, pl.loggers.TensorBoardLogger):
                tb_logger = logger.experiment
                break

        if tb_logger is None:
            raise ValueError("TensorBoard Logger not found")



[docs]
    def training_step(self, batch):
        if batch is None:
            return None
        x, y = batch
        y_hat = self.model(x)
        if y_hat.dim() == 0:
            y_hat = y_hat.unsqueeze(0)

        loss = self.criterion(y_hat, y)
        self.log(
            "train_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            sync_dist=True,
        )

        y_hat = self.activation(y_hat)

        if self.n_classes > 2:
            y_hat = torch.argmax(y_hat, dim=1)

        f1_score = self.f1_score(y_hat, y)
        self.log(
            "train_f1_score",
            f1_score,
            on_step=False,
            on_epoch=True,
            logger=True,
            sync_dist=True,
        )

        return loss



[docs]
    def validation_step(self, batch):
        if batch is None:
            return None
        x, y = batch
        y_hat = self.model(x)
        if y_hat.dim() == 0:
            y_hat = y_hat.unsqueeze(0)

        loss = self.criterion(y_hat, y)
        self.log(
            "val_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            sync_dist=True,
        )

        y_hat = self.activation(y_hat)

        if self.n_classes > 2:
            y_hat = torch.argmax(y_hat, dim=1)

        f1_score = self.f1_score(y_hat, y)
        self.log(
            "val_f1_score",
            f1_score,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            sync_dist=True,
        )



[docs]
    def configure_optimizers(self):
        optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)
        return optimizer





[docs]
class SegmentationModel(pl.LightningModule):
    """
    PyTorch Lightning module for image segmentation using a pretrained encoder.

    Uses ``segmentation_models_pytorch`` to build an encoder–decoder model.
    For binary tasks (``n_classes == 1``): sigmoid activation +
    ``FocalTverskyLoss`` + ``BinaryF1Score``. For multiclass tasks:
    softmax activation + ``MultiClassFocalLoss`` + ``MulticlassF1Score``.

    Parameters:
        input_channels (int): Number of input image channels.
        n_classes (int): Number of foreground segmentation classes.
        learning_rate (float): Learning rate for the Adam optimizer.
        architecture (str): ``smp`` architecture name (e.g. ``"Unet"``).
        encoder (str): Encoder backbone name (e.g. ``"resnet34"``).
        pretrained_weights (str): Dataset the encoder was pretrained on
            (e.g. ``"imagenet"``).
        normalization (dict): Normalization config stored as a hyperparameter
            and used at inference time to reconstruct the preprocessing pipeline.
        criterion (nn.Module, optional): Loss function. If ``None``,
            ``FocalTverskyLoss`` is used for binary tasks and
            ``MultiClassFocalLoss`` for multiclass. (default: None)
        ignore_index (int, optional): Target value to ignore in the loss and
            F1 score. (default: None)
    """

    def __init__(
        self,
        input_channels,
        n_classes,
        learning_rate,
        architecture,
        encoder,
        pretrained_weights,
        normalization,
        criterion=None,
        ignore_index=None,
    ):
        super().__init__()
        if n_classes == 1:
            self.activation = nn.Sigmoid()
        else:
            self.activation = nn.Softmax(dim=1)

        model = smp.create_model(
            arch=architecture,
            encoder_name=encoder,
            encoder_weights=pretrained_weights,
            in_channels=input_channels,
            classes=n_classes + 1 if n_classes > 1 else n_classes,
            activation=None,
        )

        self.model = model
        self.learning_rate = learning_rate
        self.ignore_index = ignore_index

        if criterion is None:
            if n_classes == 1:
                self.criterion = FocalTverskyLoss(ignore_index=self.ignore_index)
            else:
                self.criterion = MultiClassFocalLoss(
                    ignore_index=self.ignore_index,
                    alpha=torch.tensor([0.1] + [0.75] * n_classes),
                )
        else:
            self.criterion = criterion

        if n_classes == 1:
            self.f1_score = BinaryF1Score(ignore_index=self.criterion.ignore_index)
        else:
            self.f1_score = MulticlassF1Score(
                num_classes=n_classes + 1,
                ignore_index=self.criterion.ignore_index,
            )

        self.normalization = normalization
        self.save_hyperparameters(ignore=["criterion"])
        self.n_classes = n_classes


[docs]
    def forward(self, x):
        y = self.model(x)
        return self.activation(y)



[docs]
    def training_step(self, batch):
        x, y = batch
        y_hat = self.model(x)
        loss = self.criterion(y_hat, y)
        self.log(
            "train_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            sync_dist=True,
        )

        y_hat = self.activation(y_hat)
        if self.n_classes > 1 and y.dim() == 4 and y.shape[1] == 1:
            y = y.squeeze(1)

        f1_score = self.f1_score(y_hat, y)
        self.log(
            "train_f1_score",
            f1_score,
            on_step=False,
            on_epoch=True,
            logger=True,
            sync_dist=True,
        )

        return loss



[docs]
    def validation_step(self, batch):
        x, y = batch
        y_hat = self.model(x)
        loss = self.criterion(y_hat, y)
        self.log(
            "val_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            sync_dist=True,
        )

        y_hat = self.activation(y_hat)
        if self.n_classes > 1 and y.dim() == 4 and y.shape[1] == 1:
            y = y.squeeze(1)

        f1_score = self.f1_score(y_hat, y)
        self.log(
            "val_f1_score",
            f1_score,
            on_step=False,
            on_epoch=True,
            logger=True,
            prog_bar=True,
            sync_dist=True,
        )



[docs]
    def predict_step(self, batch):
        x = batch

        pred = self.forward(x)

        # binarize predictions
        if self.n_classes == 1:
            pred = pred > 0.5
        else:
            pred = torch.argmax(pred, dim=1)

        return pred



[docs]
    def configure_optimizers(self):
        optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)
        return optimizer





[docs]
class KeypointDetection1DModel(pl.LightningModule):
    """
    PyTorch Lightning module for 1D keypoint detection using a U-Net architecture.

    Operates on 1D sequences (e.g. straightened worm fluorescence profiles).
    Supports ``"Unet"``, ``"AttentionUnet"``, and ``"UnetPlusPlus"`` 1D
    architectures. Uses ``PeakWeightedMSELoss`` by default.

    Parameters:
        input_channels (int): Number of input sequence channels.
        n_classes (int): Number of keypoint classes (output channels).
        learning_rate (float): Learning rate for the Adam optimizer.
        architecture (str, optional): Architecture name; one of ``"Unet"``,
            ``"AttentionUnet"``, or ``"UnetPlusPlus"``. (default: ``"UnetPlusPlus"``)
        activation (str, optional): Output activation; one of ``"relu"``,
            ``"leaky_relu"``, ``"sigmoid"``, or ``"none"``. (default: ``"sigmoid"``)
        criterion (nn.Module, optional): Loss function. If ``None``,
            ``PeakWeightedMSELoss`` is used. (default: None)

    Raises:
        ValueError: If ``architecture`` or ``activation`` is not supported.
    """

    def __init__(
        self,
        input_channels,
        n_classes,
        learning_rate,
        architecture="UnetPlusPlus",
        activation="sigmoid",
        criterion=None,
    ):
        super().__init__()

        if architecture == "Unet":
            model = Unet1D(num_classes=n_classes, input_channels=input_channels)
        elif architecture == "AttentionUnet":
            model = AttentionUnet1D(
                num_classes=n_classes, input_channels=input_channels
            )
        elif architecture == "UnetPlusPlus":
            model = UnetPlusPlus1D(num_classes=n_classes, input_channels=input_channels)
        else:
            raise ValueError(f"Unsupported architecture: {architecture}")

        self.model = model
        self.learning_rate = learning_rate

        # Set a default ignore_index if not present
        if not hasattr(self, "ignore_index"):
            self.ignore_index = -100

        if criterion is None:
            self.criterion = PeakWeightedMSELoss()

        else:
            self.criterion = criterion

        if activation == "relu":
            self.activation = nn.ReLU(inplace=True)
        elif activation == "leaky_relu":
            self.activation = nn.LeakyReLU(inplace=True)
        elif activation == "sigmoid":
            self.activation = nn.Sigmoid()
        elif activation == "none":
            self.activation = nn.Identity()
        else:
            raise ValueError(f"Unsupported activation function: {activation}")

        self.save_hyperparameters()


[docs]
    def forward(self, x):
        y = self.model(x)
        return self.activation(y)



[docs]
    def training_step(self, batch):
        x, y = batch
        y_hat = self.model(x)
        y_hat = self.activation(y_hat)
        loss = self.criterion(y_hat, y)
        self.log(
            "train_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            sync_dist=True,
        )
        return loss



[docs]
    def validation_step(self, batch):
        x, y = batch
        y_hat = self.model(x)
        y_hat = self.activation(y_hat)
        loss = self.criterion(y_hat, y)
        self.log(
            "val_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            sync_dist=True,
        )



[docs]
    def predict_step(self, batch):
        x = batch
        pred = self.model(x)
        return pred



[docs]
    def configure_optimizers(self):
        optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)
        return optimizer