prototorch_models/prototorch/models/unsupervised.py

"""Unsupervised prototype learning algorithms."""

import numpy as np
import torch
from prototorch.core.competitions import wtac
from prototorch.core.distances import squared_euclidean_distance
from prototorch.core.losses import NeuralGasEnergy
from prototorch.nn.wrappers import LambdaLayer

from .abstract import UnsupervisedPrototypeModel
from .callbacks import GNGCallback
from .extras import ConnectionTopology
from .mixin import NonGradientMixin


class KohonenSOM(NonGradientMixin, UnsupervisedPrototypeModel):
    """Kohonen Self-Organizing-Map.

    Prototypes are associated with the cells of a 2D grid of
    ``shape = (h, w)``, so the number of prototypes is always ``h * w``.
    ``training_step`` does not return a loss; it writes the updated
    prototypes directly into ``proto_layer``.

    Hyperparameters read from ``hparams``:
        shape: pair ``(h, w)`` giving the grid size (required).
        alpha: factor multiplied into every update (default ``0.3``).
        sigma: initial neighborhood width (default ``max(h, w) / 2``).
        lr: learning rate, read via ``self.hparams.lr`` (no default is set
            here -- presumably supplied by the parent class; TODO confirm).

    Note:
        The ``hparams`` mapping passed in is modified in place:
        ``num_prototypes`` is overwritten with ``h * w``.

    TODO Allow non-2D grids

    """
    def __init__(self, hparams, **kwargs):
        h, w = hparams.get("shape")
        # Ignore `num_prototypes`: the grid shape alone fixes the count.
        hparams["num_prototypes"] = h * w
        distance_fn = kwargs.pop("distance_fn", squared_euclidean_distance)
        super().__init__(hparams, distance_fn=distance_fn, **kwargs)

        # Hyperparameters
        self.save_hyperparameters(hparams)

        # Default hparams
        self.hparams.setdefault("alpha", 0.3)
        self.hparams.setdefault("sigma", max(h, w) / 2.0)

        # Additional parameters
        # `_grid[i, j] == (i, j)`. The coordinates are generated with
        # `cartesian_prod` instead of `torch.meshgrid(x, y)` without an
        # `indexing` argument, because relying on meshgrid's implicit default
        # is deprecated. The resulting row-major layout is unchanged.
        rows, cols = torch.arange(h), torch.arange(w)
        grid = torch.cartesian_prod(rows, cols).reshape(h, w, 2)
        self.register_buffer("_grid", grid)
        # Working copies: `_sigma` is re-computed after every epoch.
        self._sigma = self.hparams.sigma
        self._lr = self.hparams.lr

    def predict_from_distances(self, distances):
        """Map distances to grid coordinates via ``wtac``.

        The flattened grid (one ``(row, col)`` pair per prototype) is handed
        to ``wtac`` in the role of the labels; presumably the result is the
        grid position of the closest prototype for each sample -- confirm
        against ``wtac``.
        """
        grid = self._grid.view(-1, 2)
        wp = wtac(distances, grid)
        return wp

    def training_step(self, train_batch, batch_idx):
        """Apply one batch update to the prototypes.

        Only ``train_batch[0]`` is used. Nothing is returned; the new
        prototypes are loaded into ``proto_layer``.
        """
        # TODO Check if the batch has labels
        x = train_batch[0]
        d = self.compute_distances(x)
        wp = self.predict_from_distances(d)
        grid = self._grid.view(-1, 2)
        # Squared distance on the grid between each sample's selected cell
        # and every cell.
        gd = squared_euclidean_distance(wp, grid)
        # Neighborhood weight decays exponentially with grid distance.
        nh = torch.exp(-gd / self._sigma**2)
        protos = self.proto_layer()
        # Pairwise sample-minus-prototype differences
        # (assumes x is (batch, dim) and protos is (h * w, dim) -- TODO confirm).
        diff = x.unsqueeze(dim=1) - protos
        delta = self._lr * self.hparams.alpha * nh.unsqueeze(-1) * diff
        # Contributions of all samples in the batch are summed.
        updated_protos = protos + delta.sum(dim=0)
        self.proto_layer.load_state_dict({"_components": updated_protos},
                                         strict=False)

    def training_epoch_end(self, training_step_outputs):
        """Shrink the neighborhood width.

        Sets ``_sigma = sigma * exp(-current_epoch / max_epochs)`` using the
        initial ``sigma`` hyperparameter and the trainer's ``max_epochs``.
        """
        self._sigma = self.hparams.sigma * np.exp(
            -self.current_epoch / self.trainer.max_epochs)

    def extra_repr(self):
        """Return a description of the grid shape for the module repr."""
        return f"(grid): (shape: {tuple(self._grid.shape)})"


class HeskesSOM(UnsupervisedPrototypeModel):
    """Placeholder for the Heskes variant of the Self-Organizing-Map.

    Construction is delegated unchanged to the parent class; training is not
    available yet.

    """
    def __init__(self, hparams, **kwargs):
        # Nothing model-specific to set up yet; forward everything as-is.
        super(HeskesSOM, self).__init__(hparams, **kwargs)

    def training_step(self, train_batch, batch_idx):
        """Always raise ``NotImplementedError``; the update rule is missing."""
        # TODO Implement me!
        raise NotImplementedError


class NeuralGas(UnsupervisedPrototypeModel):
    """Neural Gas model.

    Each training step evaluates a ``NeuralGasEnergy`` on the distances
    between the batch and the prototypes and feeds the same distances to a
    ``ConnectionTopology`` layer.

    Hyperparameters read from ``hparams``:
        agelimit: passed to ``ConnectionTopology`` (default ``10``).
        lm: passed to ``NeuralGasEnergy`` (default ``1``).
        num_prototypes: passed to ``ConnectionTopology``.

    """
    def __init__(self, hparams, **kwargs):
        super().__init__(hparams, **kwargs)

        # Record the hyperparameters, then fill in whatever is missing.
        self.save_hyperparameters(hparams)
        for key, fallback in (("agelimit", 10), ("lm", 1)):
            self.hparams.setdefault(key, fallback)

        hp = self.hparams
        self.energy_layer = NeuralGasEnergy(lm=hp.lm)
        self.topology_layer = ConnectionTopology(
            agelimit=hp.agelimit,
            num_prototypes=hp.num_prototypes,
        )

    def training_step(self, train_batch, batch_idx):
        """Compute, log and return the energy of one batch.

        Only ``train_batch[0]`` is used.
        """
        # TODO Check if the batch has labels
        samples = train_batch[0]
        distances = self.compute_distances(samples)
        # The energy layer returns a pair; only the first item is needed here.
        energy, _ = self.energy_layer(distances)
        # Called for its effect on the topology layer; the result is unused.
        self.topology_layer(distances)
        self.log("loss", energy)
        return energy

    # def training_epoch_end(self, training_step_outputs):
    #     print(f"{self.trainer.lr_schedulers}")
    #     print(f"{self.trainer.lr_schedulers[0]['scheduler'].optimizer}")


class GrowingNeuralGas(NeuralGas):
    """Neural Gas that additionally tracks an error value per prototype.

    The ``errors`` buffer holds one accumulated value per prototype. It is
    updated in every training step and is available to the ``GNGCallback``
    registered by ``configure_callbacks``.

    Hyperparameters read from ``hparams`` (in addition to ``NeuralGas``):
        step_reduction: factor applied to ``errors`` after every step
            (default ``0.5``).
        insert_reduction: passed to ``GNGCallback`` as ``reduction``
            (default ``0.1``).
        insert_freq: passed to ``GNGCallback`` as ``freq`` (default ``10``).

    """
    def __init__(self, hparams, **kwargs):
        super().__init__(hparams, **kwargs)

        # Defaults
        self.hparams.setdefault("step_reduction", 0.5)
        self.hparams.setdefault("insert_reduction", 0.1)
        self.hparams.setdefault("insert_freq", 10)

        # One error accumulator per prototype, starting at zero.
        errors = torch.zeros(self.hparams.num_prototypes, device=self.device)
        self.register_buffer("errors", errors)

    def training_step(self, train_batch, _batch_idx):
        """Compute the energy of one batch and update the error statistics.

        Only ``train_batch[0]`` is used. Returns the energy, which is also
        logged as ``"loss"``.
        """
        # TODO Check if the batch has labels
        x = train_batch[0]
        d = self.compute_distances(x)
        loss, order = self.energy_layer(d)
        # First column of `order` is used as each sample's winning prototype.
        winner = order[:, 0]

        # The error statistic is bookkeeping only. Detach it so the buffer
        # does not accumulate autograd history (and keep tensors of earlier
        # steps alive) across training steps.
        d_stat = d.detach()
        mask = torch.zeros_like(d_stat)
        mask[torch.arange(len(mask), device=mask.device), winner] = 1.0
        dp = d_stat * mask  # keep only each sample's winner distance

        # Reduce over the batch dimension only, so every prototype collects
        # the error of the samples it won. A full reduction would add the
        # same scalar to all entries and make them indistinguishable.
        # Assumes `errors` has one entry per column of `d` -- TODO confirm
        # the callback keeps both in sync when prototypes are added.
        self.errors += torch.sum(dp * dp, dim=0)
        self.errors *= self.hparams.step_reduction

        self.topology_layer(d)
        self.log("loss", loss)
        return loss

    def configure_callbacks(self):
        """Return the ``GNGCallback`` configured from the hyperparameters."""
        return [
            GNGCallback(reduction=self.hparams.insert_reduction,
                        freq=self.hparams.insert_freq)
        ]
Update Documentation Clean up project 2021-05-21 13:42:45 +00:00			`"""Unsupervised prototype learning algorithms."""`

Update SOM 2021-06-09 16:21:12 +00:00			`import numpy as np`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`import torch`
chore: Remove relative imports 2021-10-11 13:45:43 +00:00			`from prototorch.core.competitions import wtac`
			`from prototorch.core.distances import squared_euclidean_distance`
			`from prototorch.core.losses import NeuralGasEnergy`
			`from prototorch.nn.wrappers import LambdaLayer`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00
chore: Move mixins into seperate file 2021-10-11 14:05:12 +00:00			`from .abstract import UnsupervisedPrototypeModel`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`from .callbacks import GNGCallback`
			`from .extras import ConnectionTopology`
chore: Move mixins into seperate file 2021-10-11 14:05:12 +00:00			`from .mixin import NonGradientMixin`
Use Components instead of Prototypes and refactor old examples 2021-04-29 15:05:41 +00:00
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`class KohonenSOM(NonGradientMixin, UnsupervisedPrototypeModel):`
			`"""Kohonen Self-Organizing-Map.`

			`TODO Allow non-2D grids`

			`"""`
			`def __init__(self, hparams, **kwargs):`
			`h, w = hparams.get("shape")`
			# Ignore `num_prototypes`
			`hparams["num_prototypes"] = h * w`
			`distance_fn = kwargs.pop("distance_fn", squared_euclidean_distance)`
			`super().__init__(hparams, distance_fn=distance_fn, **kwargs)`

			`# Hyperparameters`
			`self.save_hyperparameters(hparams)`

			`# Default hparams`
			`self.hparams.setdefault("alpha", 0.3)`
			`self.hparams.setdefault("sigma", max(h, w) / 2.0)`

			`# Additional parameters`
			`x, y = torch.arange(h), torch.arange(w)`
			`grid = torch.stack(torch.meshgrid(x, y), dim=-1)`
			`self.register_buffer("_grid", grid)`
Update SOM 2021-06-09 16:21:12 +00:00			`self._sigma = self.hparams.sigma`
			`self._lr = self.hparams.lr`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00
			`def predict_from_distances(self, distances):`
			`grid = self._grid.view(-1, 2)`
			`wp = wtac(distances, grid)`
			`return wp`

			`def training_step(self, train_batch, batch_idx):`
			`# x = train_batch`
			`# TODO Check if the batch has labels`
			`x = train_batch[0]`
			`d = self.compute_distances(x)`
			`wp = self.predict_from_distances(d)`
			`grid = self._grid.view(-1, 2)`
			`gd = squared_euclidean_distance(wp, grid)`
Update SOM 2021-06-09 16:21:12 +00:00			`nh = torch.exp(-gd / self._sigma**2)`
fix: All examples should work on CPU and GPU now 2021-08-05 09:20:02 +00:00			`protos = self.proto_layer()`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`diff = x.unsqueeze(dim=1) - protos`
Update SOM 2021-06-09 16:21:12 +00:00			`delta = self._lr * self.hparams.alpha * nh.unsqueeze(-1) * diff`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`updated_protos = protos + delta.sum(dim=0)`
			`self.proto_layer.load_state_dict({"_components": updated_protos},`
			`strict=False)`

Update SOM 2021-06-09 16:21:12 +00:00			`def training_epoch_end(self, training_step_outputs):`
			`self._sigma = self.hparams.sigma * np.exp(`
			`-self.current_epoch / self.trainer.max_epochs)`

[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`def extra_repr(self):`
			`return f"(grid): (shape: {tuple(self._grid.shape)})"`


			`class HeskesSOM(UnsupervisedPrototypeModel):`
			`def __init__(self, hparams, **kwargs):`
			`super().__init__(hparams, **kwargs)`

			`def training_step(self, train_batch, batch_idx):`
			`# TODO Implement me!`
			`raise NotImplementedError()`


[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`class NeuralGas(UnsupervisedPrototypeModel):`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`def __init__(self, hparams, **kwargs):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`super().__init__(hparams, **kwargs)`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# Hyperparameters`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.save_hyperparameters(hparams)`

[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# Default hparams`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.hparams.setdefault("agelimit", 10)`
			`self.hparams.setdefault("lm", 1)`
Use Components instead of Prototypes and refactor old examples 2021-04-29 15:05:41 +00:00
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.energy_layer = NeuralGasEnergy(lm=self.hparams.lm)`
			`self.topology_layer = ConnectionTopology(`
			`agelimit=self.hparams.agelimit,`
Use Components instead of Prototypes and refactor old examples 2021-04-29 15:05:41 +00:00			`num_prototypes=self.hparams.num_prototypes,`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`)`

			`def training_step(self, train_batch, batch_idx):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# x = train_batch`
			`# TODO Check if the batch has labels`
Use Components instead of Prototypes and refactor old examples 2021-04-29 15:05:41 +00:00			`x = train_batch[0]`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`d = self.compute_distances(x)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`loss, _ = self.energy_layer(d)`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.topology_layer(d)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`self.log("loss", loss)`
			`return loss`

			`# def training_epoch_end(self, training_step_outputs):`
			`# print(f"{self.trainer.lr_schedulers}")`
			`# print(f"{self.trainer.lr_schedulers[0]['scheduler'].optimizer}")`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00

			`class GrowingNeuralGas(NeuralGas):`
			`def __init__(self, hparams, **kwargs):`
			`super().__init__(hparams, **kwargs)`

[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# Defaults`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`self.hparams.setdefault("step_reduction", 0.5)`
			`self.hparams.setdefault("insert_reduction", 0.1)`
			`self.hparams.setdefault("insert_freq", 10)`

[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`errors = torch.zeros(self.hparams.num_prototypes, device=self.device)`
			`self.register_buffer("errors", errors)`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
			`def training_step(self, train_batch, _batch_idx):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# x = train_batch`
			`# TODO Check if the batch has labels`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`x = train_batch[0]`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`d = self.compute_distances(x)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`loss, order = self.energy_layer(d)`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`winner = order[:, 0]`
			`mask = torch.zeros_like(d)`
			`mask[torch.arange(len(mask)), winner] = 1.0`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`dp = d * mask`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
fix: training loss is a zero dimensional tensor Should fix the problem with EarlyStopping callback. 2021-06-25 14:56:10 +00:00			`self.errors += torch.sum(dp * dp)`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`self.errors *= self.hparams.step_reduction`

			`self.topology_layer(d)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`self.log("loss", loss)`
			`return loss`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
			`def configure_callbacks(self):`
			`return [`
			`GNGCallback(reduction=self.hparams.insert_reduction,`
			`freq=self.hparams.insert_freq)`
			`]`