Mux up callback #1241 (Merged)

Commits (47):
ffb45ff  add DynamicBalanceClassSampler
2146b89  add DynamicBalanceClassSampler: add usage example
93a9d92  add DynamicBalanceClassSampler: add tests
8573676  Update catalyst/data/tests/test_sampler.py
f4b21ae  Update catalyst/data/tests/test_sampler.py (Scitator)
a12a05c  add DynamicBalanceClassSampler: debag tests (Scitator)
79332e1  update sampler: add mode
ef33956  add example notebook
2ad65c6  Merge remote-tracking branch 'original_C/master'
d61fc8f  sampler: fixes
2be40b3  samler: docs
594328f  Merge remote-tracking branch 'original_C/master'
7c6a68e  DynamicBalanceClassSampler: fixes
f5dafe4  change import order
070a4ad  change import order
3363054  Merge with master
458ae51  Merge remote-tracking branch 'original_C/master'
1815863  Merge remote-tracking branch 'original_C/master'
de8e681  Delete sampler
7ab855a  Return mixup callback
1fbabd2  CodeStyle
296d98c  Update MixUp: fix batch_size, keys, example
3ded77b  Merge branch 'master' into MuxUPCallback
4e94b35  CodeStyle and docstrings (Dokholyan)
00c5a48  Merge branch 'master' into MuxUPCallback
678a85e  MixUp tests (Dokholyan)
e48fb70  Merge branch 'MuxUPCallback' of https://github.com/Dokholyan/catalyst…
710167f  Fix beta type bag
6bea00c  Merge branch 'master' into MuxUPCallback
62a2209  Fix bag with devices (Dokholyan)
65ed442  Fix import order
3e7c358  Move the logic into a function
19d0d2d  Codestyle: fix imports
af583b9  Fix imports
6c53dd1  Add docs
b2fe666  Merge branch 'master' into MuxUPCallback
ac106d5  Update catalyst/callbacks/mixup.py (Dokholyan)
45597e8  Fix docstrings (Dokholyan)
59b4460  Update catalyst/utils/mixup.py (Dokholyan)
f264535  Update catalyst/utils/mixup.py (Dokholyan)
2769b9f  Codestyle fixes (Dokholyan)
66351e3  Merge branch 'MuxUPCallback' of https://github.com/Dokholyan/catalyst…
44eab9d  Fix Docstrings
4c5ca2e  Fix indexes generation
c0f36cc  Merge branch 'master' into MuxUPCallback
aabed03  Simplification MixUp utils (Dokholyan)
a4698ca  Merge branch 'MuxUPCallback' of https://github.com/Dokholyan/catalyst…
Diff (@@ -1,101 +1,190 @@):
Removed code (the previous implementation, which was kept commented out in the file):

```python
from typing import List

import numpy as np
import torch

from catalyst.callbacks.criterion import CriterionCallback
from catalyst.core.runner import IRunner


class MixupCallback(CriterionCallback):
    """Callback to do mixup augmentation.

    More details about mixup can be found in the paper
    `mixup: Beyond Empirical Risk Minimization`_.

    .. warning::
        `catalyst.contrib.callbacks.MixupCallback` is inherited from
        `catalyst.callbacks.CriterionCallback` and does its work.
        You should not use them together.

    .. _mixup\: Beyond Empirical Risk Minimization:  # noqa: W605
        https://arxiv.org/abs/1710.09412
    """

    def __init__(
        self,
        input_key: str = "targets",
        output_key: str = "logits",
        fields: List[str] = ("features",),
        alpha=1.0,
        on_train_only=True,
        **kwargs
    ):
        """
        Args:
            fields: list of features which must be affected.
            alpha: beta distribution a=b parameters. Must be >= 0.
                The closer alpha is to zero, the weaker the mixup effect.
            on_train_only: apply to train only. As mixup uses proxy inputs,
                the targets are also proxy. We are not interested in them,
                are we? So, if on_train_only is True, a standard
                output/metric is used for validation.
        """
        assert isinstance(input_key, str) and isinstance(output_key, str)
        assert len(fields) > 0, "At least one field for MixupCallback is required"
        assert alpha >= 0, "alpha must be >= 0"

        super().__init__(input_key=input_key, output_key=output_key, **kwargs)

        self.on_train_only = on_train_only
        self.fields = fields
        self.alpha = alpha
        self.lam = 1
        self.index = None
        self.is_needed = True

    def _compute_loss_value(self, runner: "IRunner", criterion):
        if not self.is_needed:
            return super()._compute_loss_value(runner, criterion)

        pred = runner.output[self.output_key]
        y_a = runner.input[self.input_key]
        y_b = runner.input[self.input_key][self.index]

        loss = self.lam * criterion(pred, y_a) + (1 - self.lam) * criterion(pred, y_b)
        return loss

    def on_loader_start(self, runner: "IRunner"):
        """Loader start hook.

        Args:
            runner: current runner
        """
        self.is_needed = not self.on_train_only or runner.is_train_loader

    def on_batch_start(self, runner: "IRunner") -> None:
        """Batch start hook.

        Args:
            runner: current runner
        """
        if not self.is_needed:
            return

        if self.alpha > 0:
            self.lam = np.random.beta(self.alpha, self.alpha)
        else:
            self.lam = 1

        self.index = torch.randperm(runner.input[self.fields[0]].shape[0])
        self.index = self.index.to(runner.device)

        for f in self.fields:
            runner.input[f] = (
                self.lam * runner.input[f] + (1 - self.lam) * runner.input[f][self.index]
            )


__all__ = ["MixupCallback"]
```
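The removed callback implements classic mixup: a single weight lam is drawn from Beta(alpha, alpha), the whole batch is mixed with a random permutation of itself, and the loss is mixed with the same weight. A minimal NumPy sketch of that scheme (function and variable names here are illustrative, not catalyst API):

```python
import numpy as np


def classic_mixup(batch, alpha=1.0, seed=0):
    """One shared lambda per batch; the mixing partner is a random permutation.

    Illustrative sketch of the scheme above, not a catalyst function.
    """
    rng = np.random.default_rng(seed)
    lam = rng.beta(alpha, alpha) if alpha > 0 else 1.0
    index = rng.permutation(len(batch))  # mixing partner for each sample
    mixed = lam * batch + (1 - lam) * batch[index]
    # the loss is mixed the same way:
    # loss = lam * criterion(pred, y) + (1 - lam) * criterion(pred, y[index])
    return mixed, index, lam


x = np.eye(4, dtype=np.float32)  # 4 one-hot "samples"
mixed, index, lam = classic_mixup(x)
```

Because each input row sums to 1, every mixed row also sums to lam + (1 - lam) = 1, which is an easy sanity check on the interpolation.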
New code:

```python
from typing import List, Union

import numpy as np
import torch

from catalyst.core import Callback, CallbackOrder, IRunner


class MixupCallback(Callback):
    """
    Callback to do mixup augmentation. More details about mixup can be found
    in the paper `mixup: Beyond Empirical Risk Minimization`_.

    .. _mixup\: Beyond Empirical Risk Minimization:
        https://arxiv.org/abs/1710.09412

    Examples:

    .. code-block:: python

        import os
        from typing import Any, Dict

        import numpy as np
        import torch
        from torch import nn
        from torch.utils.data import DataLoader

        from catalyst import dl
        from catalyst.callbacks import MixupCallback
        from catalyst.contrib.datasets import MNIST
        from catalyst.data.transforms import ToTensor


        class SimpleNet(nn.Module):
            def __init__(self, in_channels, in_hw, out_features):
                super().__init__()
                self.encoder = nn.Sequential(
                    nn.Conv2d(in_channels, in_channels, 3, 1, 1), nn.Tanh()
                )
                self.clf = nn.Linear(in_channels * in_hw * in_hw, out_features)

            def forward(self, x):
                z = self.encoder(x)
                z_ = z.view(z.size(0), -1)
                y_hat = self.clf(z_)
                return y_hat


        class SimpleDataset(torch.utils.data.Dataset):
            def __init__(self, train: bool = False):
                self.mnist = MNIST(
                    os.getcwd(), train=train, download=True, transform=ToTensor()
                )

            def __len__(self) -> int:
                return len(self.mnist)

            def __getitem__(self, idx: int) -> Dict[str, Any]:
                x, y = self.mnist.__getitem__(idx)
                y_one_hot = np.zeros(10)
                y_one_hot[y] = 1
                return {
                    "image": x,
                    "clf_targets": y,
                    "clf_targets_one_hot": torch.Tensor(y_one_hot),
                }


        model = SimpleNet(1, 28, 10)
        criterion = torch.nn.BCEWithLogitsLoss()
        optimizer = torch.optim.Adam(model.parameters(), lr=0.02)

        loaders = {
            "train": DataLoader(SimpleDataset(train=True), batch_size=32),
            "valid": DataLoader(SimpleDataset(train=False), batch_size=32),
        }


        class CustomRunner(dl.Runner):
            def handle_batch(self, batch):
                image = batch["image"]
                clf_logits = self.model(image)
                self.batch["clf_logits"] = clf_logits


        runner = CustomRunner()
        runner.train(
            loaders=loaders,
            model=model,
            criterion=criterion,
            optimizer=optimizer,
            logdir="./logdir14",
            num_epochs=2,
            verbose=True,
            valid_loader="valid",
            valid_metric="loss",
            minimize_valid_metric=True,
            callbacks={
                "mixup": MixupCallback(keys=["image", "clf_targets_one_hot"]),
                "criterion": dl.CriterionCallback(
                    metric_key="loss",
                    input_key="clf_logits",
                    target_key="clf_targets_one_hot",
                ),
                "optimizer": dl.OptimizerCallback(metric_key="loss"),
                "classification": dl.ControlFlowCallback(
                    dl.PrecisionRecallF1SupportCallback(
                        input_key="clf_logits",
                        target_key="clf_targets",
                        num_classes=10,
                    ),
                    ignore_loaders="train",
                ),
            },
        )

    .. note::
        This callback can only be used with an even batch size.

        By running this callback, many metrics (for example, accuracy)
        become undefined, so use ControlFlowCallback in order to evaluate
        the model (see the example above).
    """

    def __init__(
        self,
        keys: Union[str, List[str]],
        alpha=0.2,
        mode="replace",
        on_train_only=True,
        **kwargs,
    ):
        """
        Args:
            keys: batch keys to which you want to apply augmentation
            alpha: beta distribution a=b parameters. Must be >= 0.
                The closer alpha is to zero, the weaker the mixup effect.
            mode: method of use; must be in ["replace", "add"]. If "replace",
                the batch is replaced with a mixed one and the batch size
                does not change. If "add", the mixed examples are
                concatenated to the current ones and the batch size
                increases by 2 times.
            on_train_only: apply to train only. As mixup uses proxy inputs,
                the targets are also proxy. We are not interested in them,
                are we? So, if on_train_only is True, the standard
                output/metric is used for validation.
            **kwargs: extra arguments
        """
        assert isinstance(
            keys, (str, list)
        ), f"keys must be str or list[str], got: {type(keys)}"
        assert alpha >= 0, "alpha must be >= 0"
        assert mode in ["add", "replace"], (
            f"mode must be in ['add', 'replace'], got: {mode}"
        )

        super().__init__(order=CallbackOrder.Internal)
        if isinstance(keys, str):
            keys = [keys]
        self.keys = keys
        self.on_train_only = on_train_only
        self.alpha = alpha
        self.mode = mode
        self.is_needed = True

    def _handle_batch(self, runner: "IRunner") -> None:
        """
        Applies mixup augmentation for a batch.

        Args:
            runner: runner for the experiment.
        """
        batch_size = runner.batch[self.keys[0]].shape[0]
        beta = np.random.beta(self.alpha, self.alpha, batch_size).astype(np.float32)
        indexes = np.arange(batch_size)
        # index shift by 1
        indexes_2 = (indexes + 1) % batch_size
        for key in self.keys:
            targets = runner.batch[key]
            targets_shape = [batch_size] + [1] * len(targets.shape[1:])
            key_beta = beta.reshape(targets_shape)
            targets = targets * key_beta + targets[indexes_2] * (1 - key_beta)

            if self.mode == "replace":
                runner.batch[key] = targets
            else:
                # self.mode == "add"
                runner.batch[key] = torch.cat([runner.batch[key], targets])

    def on_loader_start(self, runner: "IRunner") -> None:
        """
        Loader start hook.

        Args:
            runner: current runner
        """
        self.is_needed = not self.on_train_only or runner.is_train_loader

    def on_batch_start(self, runner: "IRunner") -> None:
        """
        On batch start action.

        Args:
            runner: runner for the experiment.
        """
        if self.is_needed:
            self._handle_batch(runner)


__all__ = ["MixupCallback"]
```

Review comment (on the assert checks): I'd appreciate it if we could use tuple or set here instead of a list.
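The `_handle_batch` logic above can be sketched outside the runner as a standalone NumPy function (a hypothetical helper for illustration, mirroring the torch code): each sample gets its own beta-distributed weight and is mixed with its neighbor `(i + 1) % batch_size`; `mode="add"` concatenates instead of replacing, doubling the batch.

```python
import numpy as np


def mixup_batch(batch: np.ndarray, alpha: float = 0.2, mode: str = "replace",
                seed: int = 0) -> np.ndarray:
    """NumPy sketch of MixupCallback._handle_batch for a single key.

    Illustrative helper, not part of the catalyst API.
    """
    batch_size = batch.shape[0]
    rng = np.random.default_rng(seed)
    beta = rng.beta(alpha, alpha, batch_size).astype(np.float32)
    # reshape to (batch_size, 1, ..., 1) so each weight broadcasts over a sample
    beta = beta.reshape([batch_size] + [1] * (batch.ndim - 1))
    indexes_2 = (np.arange(batch_size) + 1) % batch_size  # index shift by 1
    mixed = batch * beta + batch[indexes_2] * (1 - beta)
    if mode == "replace":
        return mixed  # batch size unchanged
    return np.concatenate([batch, mixed])  # "add": batch size doubles


x = np.eye(4, dtype=np.float32)  # 4 one-hot "samples"
replaced = mixup_batch(x, mode="replace")
added = mixup_batch(x, mode="add")
```

Note the contrast with the removed implementation: per-sample weights and a deterministic shift-by-1 partner instead of one shared lambda and a random permutation.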
Review comment: could we make imports in lexicographical order?