prototorch_models/prototorch/models/unsupervised.py

"""Unsupervised prototype learning algorithms."""

import numpy as np
import torch
from prototorch.core.competitions import wtac
from prototorch.core.distances import squared_euclidean_distance
from prototorch.core.losses import NeuralGasEnergy

from .abstract import UnsupervisedPrototypeModel
from .callbacks import GNGCallback
from .extras import ConnectionTopology
from .mixins import NonGradientMixin


class KohonenSOM(NonGradientMixin, UnsupervisedPrototypeModel):
    """Kohonen Self-Organizing-Map.

    Prototypes are associated with the cells of a 2D integer grid of shape
    ``hparams["shape"]``. ``training_step`` moves the prototypes directly
    (via ``load_state_dict``) instead of returning a loss.

    Hyperparameters read from ``hparams``:
        shape: ``(h, w)`` grid shape. ``num_prototypes`` is overwritten
            with ``h * w``.
        alpha: scaling factor of the update (default ``0.3``).
        sigma: initial neighborhood width (default ``max(h, w) / 2.0``).
        lr: read from ``self.hparams.lr`` -- presumably defaulted by a
            base class; verify against ``UnsupervisedPrototypeModel``.

    TODO Allow non-2D grids

    """
    _grid: torch.Tensor

    def __init__(self, hparams, **kwargs):
        """Build the grid buffer and initialize the SOM hyperparameters.

        Args:
            hparams: mapping of hyperparameters; must contain ``"shape"``.
                It is mutated in place (``num_prototypes`` is set).
            **kwargs: forwarded to the parent constructor. ``distance_fn``
                defaults to ``squared_euclidean_distance``.
        """
        h, w = hparams.get("shape")
        # Ignore `num_prototypes`
        hparams["num_prototypes"] = h * w
        distance_fn = kwargs.pop("distance_fn", squared_euclidean_distance)
        super().__init__(hparams, distance_fn=distance_fn, **kwargs)

        # Hyperparameters
        self.save_hyperparameters(hparams)

        # Default hparams
        self.hparams.setdefault("alpha", 0.3)
        self.hparams.setdefault("sigma", max(h, w) / 2.0)

        # Additional parameters
        # `_grid[i, j]` holds the integer coordinate pair `(i, j)`.
        x, y = torch.arange(h), torch.arange(w)
        grid = torch.stack(torch.meshgrid(x, y, indexing="ij"), dim=-1)
        self.register_buffer("_grid", grid)
        # Current neighborhood width; decayed in `training_epoch_end`.
        self._sigma = self.hparams.sigma
        self._lr = self.hparams.lr

    def predict_from_distances(self, distances):
        """Return the result of ``wtac`` on the flattened grid coordinates.

        Args:
            distances: distances between samples and prototypes, as
                produced by ``compute_distances``.
        """
        grid = self._grid.view(-1, 2)
        wp = wtac(distances, grid)
        return wp

    def training_step(self, train_batch, batch_idx):
        """Apply one SOM update to the prototypes using ``train_batch[0]``.

        Nothing is returned; the prototypes are overwritten in place.
        """
        # x = train_batch
        # TODO Check if the batch has labels
        x = train_batch[0]
        grid = self._grid.view(-1, 2)
        # The new prototypes are written back with `load_state_dict` and no
        # loss is returned, so an autograd graph would never be used.
        with torch.no_grad():
            d = self.compute_distances(x)
            # NOTE(review): `wtac` appears to squeeze its result, which
            # would drop the batch axis for a single-sample batch -- confirm
            # against prototorch. Reshaping pins one 2-element grid
            # coordinate per row either way.
            wp = self.predict_from_distances(d).reshape(-1, 2)
            # Distance on the grid between each winner and every cell.
            gd = squared_euclidean_distance(wp, grid)
            nh = torch.exp(-gd / self._sigma**2)
            protos = self.proto_layer()
            diff = x.unsqueeze(dim=1) - protos
            delta = self._lr * self.hparams.alpha * nh.unsqueeze(-1) * diff
            # Contributions of all samples in the batch are summed.
            updated_protos = protos + delta.sum(dim=0)
        self.proto_layer.load_state_dict(
            {"_components": updated_protos},
            strict=False,
        )

    def training_epoch_end(self, training_step_outputs):
        """Decay the neighborhood width exponentially with the epoch index."""
        self._sigma = self.hparams.sigma * np.exp(
            -self.current_epoch / self.trainer.max_epochs)

    def extra_repr(self):
        """Return a string describing the shape of the grid buffer."""
        return f"(grid): (shape: {tuple(self._grid.shape)})"


class HeskesSOM(UnsupervisedPrototypeModel):
    """Placeholder for the Heskes SOM; the training step is not implemented."""

    def __init__(self, hparams, **kwargs):
        """Forward all arguments unchanged to the parent constructor."""
        super(HeskesSOM, self).__init__(hparams, **kwargs)

    def training_step(self, train_batch, batch_idx):
        """Always raise ``NotImplementedError``."""
        # TODO Implement me!
        raise NotImplementedError


class NeuralGas(UnsupervisedPrototypeModel):
    """Neural Gas model combining an energy layer with a connection topology.

    Hyperparameters (defaults are applied when a key is missing):
        age_limit: passed to ``ConnectionTopology`` as ``agelimit``
            (default ``10``).
        lm: passed to ``NeuralGasEnergy`` (default ``1``).
        num_prototypes: passed to ``ConnectionTopology``; must be present.
    """

    def __init__(self, hparams, **kwargs):
        """Store hyperparameters and build the energy and topology layers."""
        super().__init__(hparams, **kwargs)

        # Hyperparameters
        self.save_hyperparameters(hparams)

        # Default hparams
        for key, fallback in (("age_limit", 10), ("lm", 1)):
            self.hparams.setdefault(key, fallback)

        hp = self.hparams
        self.energy_layer = NeuralGasEnergy(lm=hp["lm"])
        self.topology_layer = ConnectionTopology(
            agelimit=hp["age_limit"],
            num_prototypes=hp["num_prototypes"],
        )

    def training_step(self, train_batch, batch_idx):
        """Compute, log and return the energy loss for ``train_batch[0]``.

        The topology layer is also called on the same distances.
        """
        # TODO Check if the batch has labels
        samples = train_batch[0]
        distances = self.compute_distances(samples)
        # Only the first element of the energy layer's output is used here.
        energy, _ = self.energy_layer(distances)
        self.topology_layer(distances)
        self.log("loss", energy)
        return energy


class GrowingNeuralGas(NeuralGas):
    """Neural Gas variant that accumulates an error value per prototype.

    Hyperparameters (defaults are applied when a key is missing):
        step_reduction: factor applied to ``errors`` after every training
            step (default ``0.5``).
        insert_reduction: passed to ``GNGCallback`` as ``reduction``
            (default ``0.1``).
        insert_freq: passed to ``GNGCallback`` as ``freq`` (default ``10``).
    """
    # One accumulated error entry per prototype.
    errors: torch.Tensor

    def __init__(self, hparams, **kwargs):
        """Set GNG defaults and register the zero-initialized error buffer."""
        super().__init__(hparams, **kwargs)

        # Defaults
        self.hparams.setdefault("step_reduction", 0.5)
        self.hparams.setdefault("insert_reduction", 0.1)
        self.hparams.setdefault("insert_freq", 10)

        errors = torch.zeros(
            self.hparams["num_prototypes"],
            device=self.device,
        )
        self.register_buffer("errors", errors)

    def training_step(self, train_batch, _batch_idx):
        """Update the per-prototype errors and return the energy loss.

        The loss is computed from ``train_batch[0]``, logged under
        ``"loss"`` and returned; the topology layer is called on the same
        distances.
        """
        # x = train_batch
        # TODO Check if the batch has labels
        x = train_batch[0]
        d = self.compute_distances(x)
        loss, order = self.energy_layer(d)
        # First entry of each row of `order` is used as the winner index
        # (presumably the closest prototype -- verify against
        # NeuralGasEnergy).
        winner = order[:, 0]
        # Keep only the winner's distance in each row, zero elsewhere.
        mask = torch.zeros_like(d)
        mask[torch.arange(len(mask), device=d.device), winner] = 1.0
        dp = d * mask

        # Reduce over the batch axis only, so each prototype accumulates
        # the error of the samples it won. A full reduction would add the
        # same scalar to every entry and erase the per-prototype signal.
        self.errors += torch.sum(dp * dp, dim=0)
        self.errors *= self.hparams["step_reduction"]

        self.topology_layer(d)
        self.log("loss", loss)
        return loss

    def configure_callbacks(self):
        """Return a list with one ``GNGCallback`` built from the hparams."""
        return [
            GNGCallback(
                reduction=self.hparams["insert_reduction"],
                freq=self.hparams["insert_freq"],
            )
        ]
Update Documentation Clean up project 2021-05-21 13:42:45 +00:00			`"""Unsupervised prototype learning algorithms."""`

Update SOM 2021-06-09 16:21:12 +00:00			`import numpy as np`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`import torch`
chore: replace relative imports 2022-05-16 09:12:53 +00:00			`from prototorch.core.competitions import wtac`
			`from prototorch.core.distances import squared_euclidean_distance`
			`from prototorch.core.losses import NeuralGasEnergy`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00
chore: move mixins to seperate file 2022-05-17 14:19:47 +00:00			`from .abstract import UnsupervisedPrototypeModel`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`from .callbacks import GNGCallback`
			`from .extras import ConnectionTopology`
chore: move mixins to seperate file 2022-05-17 14:19:47 +00:00			`from .mixins import NonGradientMixin`
Use Components instead of Prototypes and refactor old examples 2021-04-29 15:05:41 +00:00
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`class KohonenSOM(NonGradientMixin, UnsupervisedPrototypeModel):`
			`"""Kohonen Self-Organizing-Map.`

			`TODO Allow non-2D grids`

			`"""`
chore: minor updates and version updates 2022-05-17 10:00:52 +00:00			`_grid: torch.Tensor`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`def __init__(self, hparams, **kwargs):`
			`h, w = hparams.get("shape")`
			# Ignore `num_prototypes`
			`hparams["num_prototypes"] = h * w`
			`distance_fn = kwargs.pop("distance_fn", squared_euclidean_distance)`
			`super().__init__(hparams, distance_fn=distance_fn, **kwargs)`

			`# Hyperparameters`
			`self.save_hyperparameters(hparams)`

			`# Default hparams`
			`self.hparams.setdefault("alpha", 0.3)`
			`self.hparams.setdefault("sigma", max(h, w) / 2.0)`

			`# Additional parameters`
			`x, y = torch.arange(h), torch.arange(w)`
test: add unit tests 2022-03-30 13:12:33 +00:00			`grid = torch.stack(torch.meshgrid(x, y, indexing="ij"), dim=-1)`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`self.register_buffer("_grid", grid)`
Update SOM 2021-06-09 16:21:12 +00:00			`self._sigma = self.hparams.sigma`
			`self._lr = self.hparams.lr`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00
			`def predict_from_distances(self, distances):`
			`grid = self._grid.view(-1, 2)`
			`wp = wtac(distances, grid)`
			`return wp`

			`def training_step(self, train_batch, batch_idx):`
			`# x = train_batch`
			`# TODO Check if the batch has labels`
			`x = train_batch[0]`
			`d = self.compute_distances(x)`
			`wp = self.predict_from_distances(d)`
			`grid = self._grid.view(-1, 2)`
			`gd = squared_euclidean_distance(wp, grid)`
Update SOM 2021-06-09 16:21:12 +00:00			`nh = torch.exp(-gd / self._sigma**2)`
fix: All examples should work on CPU and GPU now 2021-08-05 09:20:02 +00:00			`protos = self.proto_layer()`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`diff = x.unsqueeze(dim=1) - protos`
Update SOM 2021-06-09 16:21:12 +00:00			`delta = self._lr * self.hparams.alpha * nh.unsqueeze(-1) * diff`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`updated_protos = protos + delta.sum(dim=0)`
chore: fix errors for pytorch_lightning>1.6 2022-04-27 07:25:42 +00:00			`self.proto_layer.load_state_dict(`
			`{"_components": updated_protos},`
			`strict=False,`
			`)`
[WIP] Add SOM 2021-06-07 16:44:15 +00:00
Update SOM 2021-06-09 16:21:12 +00:00			`def training_epoch_end(self, training_step_outputs):`
			`self._sigma = self.hparams.sigma * np.exp(`
			`-self.current_epoch / self.trainer.max_epochs)`

[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`def extra_repr(self):`
			`return f"(grid): (shape: {tuple(self._grid.shape)})"`


			`class HeskesSOM(UnsupervisedPrototypeModel):`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
[WIP] Add SOM 2021-06-07 16:44:15 +00:00			`def __init__(self, hparams, **kwargs):`
			`super().__init__(hparams, **kwargs)`

			`def training_step(self, train_batch, batch_idx):`
			`# TODO Implement me!`
			`raise NotImplementedError()`


[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`class NeuralGas(UnsupervisedPrototypeModel):`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`def __init__(self, hparams, **kwargs):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`super().__init__(hparams, **kwargs)`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# Hyperparameters`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.save_hyperparameters(hparams)`

[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# Default hparams`
test: add unit tests 2022-03-30 13:12:33 +00:00			`self.hparams.setdefault("age_limit", 10)`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.hparams.setdefault("lm", 1)`
Use Components instead of Prototypes and refactor old examples 2021-04-29 15:05:41 +00:00
chore: minor updates and version updates 2022-05-17 10:00:52 +00:00			`self.energy_layer = NeuralGasEnergy(lm=self.hparams["lm"])`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.topology_layer = ConnectionTopology(`
chore: minor updates and version updates 2022-05-17 10:00:52 +00:00			`agelimit=self.hparams["age_limit"],`
			`num_prototypes=self.hparams["num_prototypes"],`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`)`

			`def training_step(self, train_batch, batch_idx):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# x = train_batch`
			`# TODO Check if the batch has labels`
Use Components instead of Prototypes and refactor old examples 2021-04-29 15:05:41 +00:00			`x = train_batch[0]`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`d = self.compute_distances(x)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`loss, _ = self.energy_layer(d)`
Add Neural Gas Model. 2021-04-23 15:30:23 +00:00			`self.topology_layer(d)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`self.log("loss", loss)`
			`return loss`

[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
			`class GrowingNeuralGas(NeuralGas):`
chore: minor updates and version updates 2022-05-17 10:00:52 +00:00			`errors: torch.Tensor`
ci: add github actions (#16) * chore: update pre-commit versions * ci: remove old configurations * ci: copy workflow from prototorch * ci: run precommit for all files * ci: add examples CPU test * ci(test): failing example test * ci: fix workflow definition * ci(test): repeat failing example test * ci: fix workflow definition * ci(test): repeat failing example test II * ci: fix test command * ci: cleanup example test * ci: remove travis badge 2022-01-11 17:28:50 +00:00
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`def __init__(self, hparams, **kwargs):`
			`super().__init__(hparams, **kwargs)`

[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# Defaults`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`self.hparams.setdefault("step_reduction", 0.5)`
			`self.hparams.setdefault("insert_reduction", 0.1)`
			`self.hparams.setdefault("insert_freq", 10)`

chore: minor updates and version updates 2022-05-17 10:00:52 +00:00			`errors = torch.zeros(`
			`self.hparams["num_prototypes"],`
			`device=self.device,`
			`)`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`self.register_buffer("errors", errors)`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
			`def training_step(self, train_batch, _batch_idx):`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`# x = train_batch`
			`# TODO Check if the batch has labels`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`x = train_batch[0]`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`d = self.compute_distances(x)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`loss, order = self.energy_layer(d)`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`winner = order[:, 0]`
			`mask = torch.zeros_like(d)`
			`mask[torch.arange(len(mask)), winner] = 1.0`
[REFACTOR] Major cleanup 2021-06-04 20:20:32 +00:00			`dp = d * mask`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
fix: training loss is a zero dimensional tensor Should fix the problem with EarlyStopping callback. 2021-06-25 14:56:10 +00:00			`self.errors += torch.sum(dp * dp)`
chore: minor updates and version updates 2022-05-17 10:00:52 +00:00			`self.errors *= self.hparams["step_reduction"]`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
			`self.topology_layer(d)`
[BUGFIX] Log loss in NG and GNG 2021-06-11 16:50:14 +00:00			`self.log("loss", loss)`
			`return loss`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00
			`def configure_callbacks(self):`
			`return [`
chore: fix errors for pytorch_lightning>1.6 2022-04-27 07:25:42 +00:00			`GNGCallback(`
chore: minor updates and version updates 2022-05-17 10:00:52 +00:00			`reduction=self.hparams["insert_reduction"],`
			`freq=self.hparams["insert_freq"],`
chore: fix errors for pytorch_lightning>1.6 2022-04-27 07:25:42 +00:00			`)`
[FEATURE] Add Growing Neural Gas 2021-06-01 15:19:43 +00:00			`]`