prototorch_models/prototorch/models/abstract.py

"""Abstract classes to be inherited by prototorch models."""

import pytorch_lightning as pl
import torch
import torchmetrics

from ..core.competitions import WTAC
from ..core.components import Components, LabeledComponents
from ..core.distances import euclidean_distance
from ..core.initializers import LabelsInitializer, ZerosCompInitializer
from ..core.pooling import stratified_min_pooling
from ..nn.wrappers import LambdaLayer


class ProtoTorchBolt(pl.LightningModule):
    """All ProtoTorch models are ProtoTorch Bolts.

    Stores the hyperparameters and the optimizer / learning-rate scheduler
    configuration that every model in this module builds upon.

    Args:
        hparams: Hyperparameters, handed to ``save_hyperparameters``.
            ``lr`` is set to ``0.01`` when it is not provided.
        **kwargs: Optional configuration. The keys read here are
            ``optimizer`` (default ``torch.optim.Adam``), ``lr_scheduler``
            (default ``None``) and ``lr_scheduler_kwargs`` (default ``{}``).
            Any other key is ignored by this class.
    """

    def __init__(self, hparams, **kwargs):
        super().__init__()

        # Hyperparameters
        self.save_hyperparameters(hparams)

        # Default hparams
        self.hparams.setdefault("lr", 0.01)

        # Default config
        self.optimizer = kwargs.get("optimizer", torch.optim.Adam)
        self.lr_scheduler = kwargs.get("lr_scheduler", None)
        self.lr_scheduler_kwargs = kwargs.get("lr_scheduler_kwargs", dict())

    def configure_optimizers(self):
        """Build the optimizer and, if configured, its scheduler.

        Returns:
            The optimizer alone when no ``lr_scheduler`` was configured,
            otherwise ``([optimizer], [scheduler_config])`` where the
            scheduler config requests an update after each training step.
        """
        optimizer = self.optimizer(self.parameters(), lr=self.hparams.lr)
        if self.lr_scheduler is not None:
            scheduler = self.lr_scheduler(optimizer,
                                          **self.lr_scheduler_kwargs)
            sch = {
                "scheduler": scheduler,
                "interval": "step",
            }  # called after each training step
            return [optimizer], [sch]
        else:
            return optimizer

    def reconfigure_optimizers(self):
        """Ask the attached trainer to set up the optimizers again.

        Does nothing (apart from emitting a warning) when the model is not
        attached to a trainer, so that models can be modified before
        training starts.
        """
        try:
            trainer = self.trainer
        except RuntimeError:
            # NOTE(review): newer Lightning releases appear to raise here
            # instead of returning `None` for a detached module - confirm
            # against the installed version.
            trainer = None

        if trainer is None:
            import warnings

            warnings.warn(
                "No trainer attached; skipping optimizer reconfiguration.",
                stacklevel=2,
            )
            return

        # `setup_optimizers` lives on `trainer.strategy` in newer Lightning
        # releases and on `trainer.accelerator` in older ones; use whichever
        # the attached trainer provides.
        backend = getattr(trainer, "strategy", None)
        if not hasattr(backend, "setup_optimizers"):
            backend = trainer.accelerator
        backend.setup_optimizers(trainer)

    def __repr__(self):
        """Return the parent representation, tab-indented and wrapped."""
        surep = super().__repr__()
        indented = "".join([f"\t{line}\n" for line in surep.splitlines()])
        wrapped = f"ProtoTorch Bolt(\n{indented})"
        return wrapped


class PrototypeModel(ProtoTorchBolt):
    """Base class for models that keep their prototypes in ``proto_layer``.

    Only the distance layer is created here; ``self.proto_layer`` is read by
    the properties and methods below but is not assigned in this class.

    Args:
        hparams: Hyperparameters, passed on to the parent class.
        **kwargs: Passed on to the parent class. ``distance_fn`` (default
            ``euclidean_distance``) is additionally read here.
    """

    def __init__(self, hparams, **kwargs):
        super().__init__(hparams, **kwargs)

        # The distance function is wrapped in a `LambdaLayer`.
        self.distance_layer = LambdaLayer(
            kwargs.get("distance_fn", euclidean_distance))

    @property
    def num_prototypes(self):
        """Length of the prototype layer's components."""
        layer = self.proto_layer
        return len(layer.components)

    @property
    def prototypes(self):
        """Detached CPU copy of the prototype layer's components."""
        detached = self.proto_layer.components.detach()
        return detached.cpu()

    @property
    def components(self):
        """Only an alias for the prototypes."""
        return self.prototypes

    def _sync_after_resize(self):
        """Store the layer's current distribution and rebuild optimizers."""
        self.hparams.distribution = self.proto_layer.distribution
        self.reconfigure_optimizers()

    def add_prototypes(self, *args, **kwargs):
        """Add components to the prototype layer.

        All arguments are forwarded to ``proto_layer.add_components``.
        """
        self.proto_layer.add_components(*args, **kwargs)
        self._sync_after_resize()

    def remove_prototypes(self, indices):
        """Remove the components at ``indices`` from the prototype layer."""
        self.proto_layer.remove_components(indices)
        self._sync_after_resize()


class UnsupervisedPrototypeModel(PrototypeModel):
    """Prototype model whose prototype layer is a plain ``Components``.

    Args:
        hparams: Hyperparameters; ``num_prototypes`` is read when a
            prototype layer is created.
        **kwargs: Passed on to the parent class. ``prototypes_initializer``
            is additionally read here.
    """

    def __init__(self, hparams, **kwargs):
        super().__init__(hparams, **kwargs)

        # Layers
        initializer = kwargs.get("prototypes_initializer")
        if initializer is None:
            # Without an initializer no prototype layer is created here.
            return
        self.proto_layer = Components(
            self.hparams.num_prototypes,
            initializer=initializer,
        )

    def compute_distances(self, x):
        """Return the distance layer's output for ``x`` and the prototypes.

        The prototypes are converted with ``type_as(x)`` before the distance
        layer is applied.
        """
        return self.distance_layer(x, self.proto_layer().type_as(x))

    def forward(self, x):
        """Return the distances computed by ``compute_distances``."""
        return self.compute_distances(x)


class SupervisedPrototypeModel(PrototypeModel):
    """Prototype model whose prototype layer is a ``LabeledComponents``.

    Args:
        hparams: Hyperparameters. ``distribution`` is read from the saved
            hyperparameters (``None`` when absent) and handed to the
            prototype layer.
        skip_proto_layer: When true, no prototype layer is created here.
        **kwargs: Passed on to the parent class. ``prototypes_initializer``
            (default ``None``) and ``labels_initializer`` (default
            ``LabelsInitializer()``) are additionally read here.
    """

    def __init__(self, hparams, skip_proto_layer=False, **kwargs):
        super().__init__(hparams, **kwargs)

        # Layers
        # Read from the saved, dict-like `self.hparams` instead of the raw
        # argument, so that containers without a `.get` method (for example
        # an `argparse.Namespace`) are handled as well.
        distribution = self.hparams.get("distribution", None)
        prototypes_initializer = kwargs.get("prototypes_initializer", None)
        labels_initializer = kwargs.get("labels_initializer",
                                        LabelsInitializer())
        if not skip_proto_layer:
            # when subclasses do not need a customized prototype layer
            if prototypes_initializer is not None:
                # when building a new model
                self.proto_layer = LabeledComponents(
                    distribution=distribution,
                    components_initializer=prototypes_initializer,
                    labels_initializer=labels_initializer,
                )
                # Remember the per-prototype shape in the hyperparameters;
                # the branch below reads it back.
                proto_shape = self.proto_layer.components.shape[1:]
                self.hparams.initialized_proto_shape = proto_shape
            else:
                # when restoring a checkpointed model
                self.proto_layer = LabeledComponents(
                    distribution=distribution,
                    components_initializer=ZerosCompInitializer(
                        self.hparams.initialized_proto_shape),
                )
        self.competition_layer = WTAC()

    @property
    def prototype_labels(self):
        """Detached CPU copy of the prototype layer's labels."""
        return self.proto_layer.labels.detach().cpu()

    @property
    def num_classes(self):
        """Number of classes as reported by the prototype layer."""
        return self.proto_layer.num_classes

    def compute_distances(self, x):
        """Return the distance layer's output for ``x`` and the prototypes."""
        protos, _ = self.proto_layer()
        distances = self.distance_layer(x, protos)
        return distances

    def forward(self, x):
        """Return a softmin (over ``dim=1``) of the pooled distances.

        The distances are pooled with ``stratified_min_pooling`` using the
        prototype labels before the softmin is applied.
        """
        distances = self.compute_distances(x)
        _, plabels = self.proto_layer()
        winning = stratified_min_pooling(distances, plabels)
        y_pred = torch.nn.functional.softmin(winning, dim=1)
        return y_pred

    def predict_from_distances(self, distances):
        """Apply the competition layer to ``distances`` without gradients."""
        with torch.no_grad():
            _, plabels = self.proto_layer()
            y_pred = self.competition_layer(distances, plabels)
        return y_pred

    def predict(self, x):
        """Compute distances for ``x`` without gradients and predict."""
        with torch.no_grad():
            distances = self.compute_distances(x)
        y_pred = self.predict_from_distances(distances)
        return y_pred

    def log_acc(self, distances, targets, tag):
        """Log the accuracy of the predictions from ``distances`` as ``tag``.

        The value is logged per epoch (not per step), to the progress bar
        and to the logger.
        """
        preds = self.predict_from_distances(distances)
        accuracy = torchmetrics.functional.accuracy(preds.int(), targets.int())
        # `.int()` because FloatTensors are assumed to be class probabilities

        self.log(tag,
                 accuracy,
                 on_step=False,
                 on_epoch=True,
                 prog_bar=True,
                 logger=True)

    def test_step(self, batch, batch_idx):
        """Log the accuracy on a test batch as ``test_acc``.

        ``batch`` is unpacked into the inputs and the targets.
        """
        x, targets = batch

        preds = self.predict(x)
        accuracy = torchmetrics.functional.accuracy(preds.int(), targets.int())

        self.log("test_acc", accuracy)


class ProtoTorchMixin:
    """Common base class of all ProtoTorch mixins.

    It defines no behavior of its own.
    """


class NonGradientMixin(ProtoTorchMixin):
    """Mixin for custom non-gradient optimization.

    Sets ``automatic_optimization`` to ``False`` on the instance and leaves
    ``training_step`` to be implemented by the class that uses the mixin.
    """

    def __init__(self, *args, **kwargs):
        # All arguments go unchanged to the next class in the MRO.
        super().__init__(*args, **kwargs)
        # NOTE(review): presumably this makes Lightning leave the parameter
        # updates to `training_step` - confirm against the Lightning docs.
        self.automatic_optimization = False

    def training_step(self, train_batch, batch_idx, optimizer_idx=None):
        """Placeholder to be overridden; always raises ``NotImplementedError``."""
        raise NotImplementedError


class ImagePrototypesMixin(ProtoTorchMixin):
    """Mixin for models with image prototypes.

    Expects the class it is mixed into to provide ``proto_layer`` and
    ``components``.
    """

    def on_train_batch_end(self, outputs, batch, batch_idx, dataloader_idx=0):
        """Constrain the components to the range [0, 1] by clamping after updates.

        None of the arguments are used. ``dataloader_idx`` has a default so
        that the hook can be called both with and without it.
        """
        self.proto_layer.components.data.clamp_(0.0, 1.0)

    def get_prototype_grid(self, num_columns=2, return_channels_last=True):
        """Arrange the components in an image grid.

        Args:
            num_columns: Passed to ``make_grid`` as ``nrow``.
            return_channels_last: When true, the grid's axes are permuted
                with ``(1, 2, 0)`` so that the first axis becomes the last.

        Returns:
            The grid tensor on the CPU.
        """
        # Imported here so that torchvision is only needed by this method.
        from torchvision.utils import make_grid
        grid = make_grid(self.components, nrow=num_columns)
        if return_channels_last:
            grid = grid.permute((1, 2, 0))
        return grid.cpu()
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`"""Abstract classes to be inherited by prototorch models."""`

Add missing abstract.py file 2021-04-29 17:14:33 +00:00			`import pytorch_lightning as pl`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`import torch`
			`import torchmetrics`
Import from the newly cleaned-up prototorch namespace 2021-06-14 18:08:08 +00:00
			`from ..core.competitions import WTAC`
			`from ..core.components import Components, LabeledComponents`
			`from ..core.distances import euclidean_distance`
fix: update `hparams.distribution` as it changes during training 2022-02-02 20:53:03 +00:00			`from ..core.initializers import LabelsInitializer, ZerosCompInitializer`
Import from the newly cleaned-up prototorch namespace 2021-06-14 18:08:08 +00:00			`from ..core.pooling import stratified_min_pooling`
			`from ..nn.wrappers import LambdaLayer`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00

			`class ProtoTorchBolt(pl.LightningModule):`
Update SOM 2021-06-09 16:21:12 +00:00			`"""All ProtoTorch models are ProtoTorch Bolts."""`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`def __init__(self, hparams, **kwargs):`
			`super().__init__()`

			`# Hyperparameters`
			`self.save_hyperparameters(hparams)`

			`# Default hparams`
			`self.hparams.setdefault("lr", 0.01)`

			`# Default config`
			`self.optimizer = kwargs.get("optimizer", torch.optim.Adam)`
			`self.lr_scheduler = kwargs.get("lr_scheduler", None)`
			`self.lr_scheduler_kwargs = kwargs.get("lr_scheduler_kwargs", dict())`
Add missing abstract.py file 2021-04-29 17:14:33 +00:00
			`def configure_optimizers(self):`
Change optimizer using kwargs 2021-05-11 14:13:00 +00:00			`optimizer = self.optimizer(self.parameters(), lr=self.hparams.lr)`
No implicit learning rate scheduling 2021-06-04 13:55:06 +00:00			`if self.lr_scheduler is not None:`
			`scheduler = self.lr_scheduler(optimizer,`
			`**self.lr_scheduler_kwargs)`
			`sch = {`
			`"scheduler": scheduler,`
			`"interval": "step",`
			`} # called after each training step`
			`return [optimizer], [sch]`
			`else:`
			`return optimizer`
Stop passing component initializers as hparams Pass the component initializer as an hparam slows down the script very much. The API has now been changed to pass it as a kwarg to the models instead. The example scripts have also been updated to reflect the new changes. Also, ImageGMLVQ and an example script `gmlvq_mnist.py` that uses it have also been added. 2021-05-12 14:36:22 +00:00
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`def reconfigure_optimizers(self):`
fix: remove deprecated `Trainer.accelerator_backend` 2021-06-30 14:03:45 +00:00			`self.trainer.accelerator.setup_optimizers(self.trainer)`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00
refactor: clean up abstract classes 2021-07-14 17:17:05 +00:00			`def __repr__(self):`
			`surep = super().__repr__()`
			`indented = "".join([f"\t{line}\n" for line in surep.splitlines()])`
			`wrapped = f"ProtoTorch Bolt(\n{indented})"`
			`return wrapped`


			`class PrototypeModel(ProtoTorchBolt):`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
refactor: clean up abstract classes 2021-07-14 17:17:05 +00:00			`def __init__(self, hparams, **kwargs):`
			`super().__init__(hparams, **kwargs)`

			`distance_fn = kwargs.get("distance_fn", euclidean_distance)`
			`self.distance_layer = LambdaLayer(distance_fn)`

			`@property`
			`def num_prototypes(self):`
			`return len(self.proto_layer.components)`

			`@property`
			`def prototypes(self):`
			`return self.proto_layer.components.detach().cpu()`

			`@property`
			`def components(self):`
			`"""Only an alias for the prototypes."""`
			`return self.prototypes`

[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`def add_prototypes(self, args, *kwargs):`
			`self.proto_layer.add_components(args, *kwargs)`
fix: update `hparams.distribution` as it changes during training 2022-02-02 20:53:03 +00:00			`self.hparams.distribution = self.proto_layer.distribution`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`self.reconfigure_optimizers()`

			`def remove_prototypes(self, indices):`
			`self.proto_layer.remove_components(indices)`
fix: update `hparams.distribution` as it changes during training 2022-02-02 20:53:03 +00:00			`self.hparams.distribution = self.proto_layer.distribution`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`self.reconfigure_optimizers()`


			`class UnsupervisedPrototypeModel(PrototypeModel):`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`def __init__(self, hparams, **kwargs):`
			`super().__init__(hparams, **kwargs)`

			`# Layers`
[BUGFIX] KNN works again 2021-06-14 18:09:41 +00:00			`prototypes_initializer = kwargs.get("prototypes_initializer", None)`
			`if prototypes_initializer is not None:`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`self.proto_layer = Components(`
			`self.hparams.num_prototypes,`
[BUGFIX] KNN works again 2021-06-14 18:09:41 +00:00			`initializer=prototypes_initializer,`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`)`

			`def compute_distances(self, x):`
fix: All examples should work on CPU and GPU now 2021-08-05 09:20:02 +00:00			`protos = self.proto_layer().type_as(x)`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`distances = self.distance_layer(x, protos)`
			`return distances`

			`def forward(self, x):`
			`distances = self.compute_distances(x)`
			`return distances`


			`class SupervisedPrototypeModel(PrototypeModel):`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
fix: CBC example works again 2022-03-30 13:10:06 +00:00			`def __init__(self, hparams, skip_proto_layer=False, **kwargs):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`super().__init__(hparams, **kwargs)`

			`# Layers`
fix: CBC example works again 2022-03-30 13:10:06 +00:00			`distribution = hparams.get("distribution", None)`
[BUGFIX] KNN works again 2021-06-14 18:09:41 +00:00			`prototypes_initializer = kwargs.get("prototypes_initializer", None)`
[FEATURE] Add warm-starting example 2021-06-14 18:42:57 +00:00			`labels_initializer = kwargs.get("labels_initializer",`
			`LabelsInitializer())`
fix: CBC example works again 2022-03-30 13:10:06 +00:00			`if not skip_proto_layer:`
			`# when subclasses do not need a customized prototype layer`
			`if prototypes_initializer is not None:`
			`# when building a new model`
			`self.proto_layer = LabeledComponents(`
			`distribution=distribution,`
			`components_initializer=prototypes_initializer,`
			`labels_initializer=labels_initializer,`
			`)`
			`proto_shape = self.proto_layer.components.shape[1:]`
			`self.hparams.initialized_proto_shape = proto_shape`
			`else:`
			`# when restoring a checkpointed model`
			`self.proto_layer = LabeledComponents(`
			`distribution=distribution,`
			`components_initializer=ZerosCompInitializer(`
			`self.hparams.initialized_proto_shape),`
			`)`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`self.competition_layer = WTAC()`

			`@property`
			`def prototype_labels(self):`
[BUGFIX] KNN works again 2021-06-14 18:09:41 +00:00			`return self.proto_layer.labels.detach().cpu()`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00
			`@property`
			`def num_classes(self):`
[BUGFIX] `examples/cbc_iris.py` works again 2021-06-15 13:59:47 +00:00			`return self.proto_layer.num_classes`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00
			`def compute_distances(self, x):`
			`protos, _ = self.proto_layer()`
			`distances = self.distance_layer(x, protos)`
			`return distances`

			`def forward(self, x):`
			`distances = self.compute_distances(x)`
fix: labels where on cpu in forward pass 2021-08-05 07:14:32 +00:00			`_, plabels = self.proto_layer()`
[BUGFIX] KNN works again 2021-06-14 18:09:41 +00:00			`winning = stratified_min_pooling(distances, plabels)`
fix(warning): specify dimension explicitly when calling `softmin` 2021-11-16 09:19:31 +00:00			`y_pred = torch.nn.functional.softmin(winning, dim=1)`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`return y_pred`

			`def predict_from_distances(self, distances):`
			`with torch.no_grad():`
fix: labels where on cpu in forward pass 2021-08-05 07:14:32 +00:00			`_, plabels = self.proto_layer()`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`y_pred = self.competition_layer(distances, plabels)`
			`return y_pred`

			`def predict(self, x):`
			`with torch.no_grad():`
			`distances = self.compute_distances(x)`
			`y_pred = self.predict_from_distances(distances)`
			`return y_pred`

			`def log_acc(self, distances, targets, tag):`
			`preds = self.predict_from_distances(distances)`
			`accuracy = torchmetrics.functional.accuracy(preds.int(), targets.int())`
			# `.int()` because FloatTensors are assumed to be class probabilities

			`self.log(tag,`
			`accuracy,`
			`on_step=False,`
			`on_epoch=True,`
			`prog_bar=True,`
			`logger=True)`
feat: add simple test step 2021-09-10 17:19:51 +00:00
			`def test_step(self, batch, batch_idx):`
			`x, targets = batch`

			`preds = self.predict(x)`
			`accuracy = torchmetrics.functional.accuracy(preds.int(), targets.int())`

			`self.log("test_acc", accuracy)`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00

refactor: clean up abstract classes 2021-07-14 17:17:05 +00:00			`class ProtoTorchMixin(object):`
			`"""All mixins are ProtoTorchMixins."""`


Update SOM 2021-06-09 16:21:12 +00:00			`class NonGradientMixin(ProtoTorchMixin):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`"""Mixin for custom non-gradient optimization."""`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`def __init__(self, args, *kwargs):`
			`super().__init__(args, *kwargs)`
feat(compatibility): Python3.6 compatibility 2021-08-30 15:15:40 +00:00			`self.automatic_optimization = False`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00
			`def training_step(self, train_batch, batch_idx, optimizer_idx=None):`
			`raise NotImplementedError`

Stop passing component initializers as hparams Pass the component initializer as an hparam slows down the script very much. The API has now been changed to pass it as a kwarg to the models instead. The example scripts have also been updated to reflect the new changes. Also, ImageGMLVQ and an example script `gmlvq_mnist.py` that uses it have also been added. 2021-05-12 14:36:22 +00:00
Update SOM 2021-06-09 16:21:12 +00:00			`class ImagePrototypesMixin(ProtoTorchMixin):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`"""Mixin for models with image prototypes."""`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
Stop passing component initializers as hparams Pass the component initializer as an hparam slows down the script very much. The API has now been changed to pass it as a kwarg to the models instead. The example scripts have also been updated to reflect the new changes. Also, ImageGMLVQ and an example script `gmlvq_mnist.py` that uses it have also been added. 2021-05-12 14:36:22 +00:00			`def on_train_batch_end(self, outputs, batch, batch_idx, dataloader_idx):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`"""Constrain the components to the range [0, 1] by clamping after updates."""`
Stop passing component initializers as hparams Pass the component initializer as an hparam slows down the script very much. The API has now been changed to pass it as a kwarg to the models instead. The example scripts have also been updated to reflect the new changes. Also, ImageGMLVQ and an example script `gmlvq_mnist.py` that uses it have also been added. 2021-05-12 14:36:22 +00:00			`self.proto_layer.components.data.clamp_(0.0, 1.0)`
Cleanup models Siamese architectures no longer accept a `backbone_module`. They have to be initialized with an pre-initialized backbone object instead. This is so that the visualization callbacks could use the very same object for visualization purposes. Also, there's no longer a dependent copy of the backbone. It is managed simply with `requires_grad` instead. 2021-05-17 15:00:23 +00:00
Use 'num_' in all variable names 2021-05-25 13:41:10 +00:00			`def get_prototype_grid(self, num_columns=2, return_channels_last=True):`
Add get_prototype_grid method 2021-05-21 11:11:48 +00:00			`from torchvision.utils import make_grid`
Use 'num_' in all variable names 2021-05-25 13:41:10 +00:00			`grid = make_grid(self.components, nrow=num_columns)`
Add get_prototype_grid method 2021-05-21 11:11:48 +00:00			`if return_channels_last:`
			`grid = grid.permute((1, 2, 0))`
			`return grid.cpu()`