
Commit 6f2ebea

Move out label_smoothing and try roll instead of flip
1 parent: c15dce0

File tree: 2 files changed (+9, -26 lines)


test/test_transforms_tensor.py

Lines changed: 4 additions & 7 deletions
```diff
@@ -728,15 +728,14 @@ def test_gaussian_blur(device, meth_kwargs):
     {"mixup_alpha": 0.0, "cutmix_alpha": 1.0},
     {"mixup_alpha": 1.0, "cutmix_alpha": 0.0},
 ])
-@pytest.mark.parametrize('label_smoothing', [0.0, 0.1])
 @pytest.mark.parametrize('inplace', [True, False])
-def test_random_mixupcutmix(device, alphas, label_smoothing, inplace):
+def test_random_mixupcutmix(device, alphas, inplace):
     batch_size = 32
     num_classes = 10
     batch = torch.rand(batch_size, 3, 44, 56, device=device)
     targets = torch.randint(num_classes, (batch_size, ), device=device, dtype=torch.int64)
 
-    fn = T.RandomMixupCutmix(num_classes, label_smoothing=label_smoothing, inplace=inplace, **alphas)
+    fn = T.RandomMixupCutmix(num_classes, inplace=inplace, **alphas)
     scripted_fn = torch.jit.script(fn)
 
     seed = torch.seed()
@@ -763,8 +762,6 @@ def test_random_mixupcutmix_with_invalid_data():
         t(torch.rand(32, 3, 60, 60), torch.randint(10, (32, 1)))
     with pytest.raises(ValueError, match="Target dtype should be torch.int64."):
         t(torch.rand(32, 3, 60, 60), torch.randint(10, (32, ), dtype=torch.int32))
-    with pytest.raises(ValueError, match="The batch size should be even."):
-        t(torch.rand(31, 3, 60, 60), torch.randint(10, (31, )))
 
 
 def test_random_mixupcutmix_with_real_data():
@@ -779,7 +776,7 @@ def test_random_mixupcutmix_with_real_data():
     dataset = TensorDataset(torch.stack(images).to(torch.float32), torch.tensor([0, 1]))
 
     # Use mixup in the collate
-    mixup = T.RandomMixupCutmix(2, cutmix_alpha=1.0, mixup_alpha=1.0, label_smoothing=0.1)
+    mixup = T.RandomMixupCutmix(2, cutmix_alpha=1.0, mixup_alpha=1.0)
     dataloader = DataLoader(dataset, batch_size=2,
                             collate_fn=lambda batch: mixup(*(torch.stack(x) for x in zip(*batch))))
 
@@ -791,5 +788,5 @@ def test_random_mixupcutmix_with_real_data():
 
     torch.testing.assert_close(
         torch.stack(stats).mean(dim=0),
-        torch.tensor([46.94434738, 64.79092407, 0.23949696])
+        torch.tensor([46.931968688964844, 69.97343444824219, 0.459820032119751])
     )
```
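The `label_smoothing` knob disappears from these tests because the transform no longer smooths targets itself; it now emits plain one-hot vectors (see the transforms.py diff below). A minimal sketch, assuming the smoothing is meant to move into the loss function instead: `torch.nn.CrossEntropyLoss` has accepted a `label_smoothing` argument and probabilistic (e.g. one-hot or mixed) targets since PyTorch 1.10.

```python
import torch
import torch.nn.functional as F

num_classes = 10
target = torch.randint(num_classes, (4,))

# What the transform now produces: plain one-hot float targets.
one_hot = F.one_hot(target, num_classes=num_classes).to(dtype=torch.float32)

# Smoothing can then live in the loss rather than in the transform
# (CrossEntropyLoss supports label_smoothing and probabilistic
# targets since PyTorch 1.10).
criterion = torch.nn.CrossEntropyLoss(label_smoothing=0.1)
logits = torch.randn(4, num_classes)
loss = criterion(logits, one_hot)
```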

torchvision/transforms/transforms.py

Lines changed: 5 additions & 19 deletions
```diff
@@ -1971,15 +1971,13 @@ class RandomMixupCutmix(torch.nn.Module):
             Default value is 0.5.
         cutmix_alpha (float): hyperparameter of the Beta distribution used for cutmix.
             Set to 0.0 to turn off. Default value is 0.0.
-        label_smoothing (float): the amount of smoothing using when one-hot encoding.
-            Set to 0.0 to turn off. Default value is 0.0.
         inplace (bool): boolean to make this transform inplace. Default set to False.
     """
 
     def __init__(self, num_classes: int,
                  p: float = 1.0, mixup_alpha: float = 1.0,
                  cutmix_p: float = 0.5, cutmix_alpha: float = 0.0,
-                 label_smoothing: float = 0.0, inplace: bool = False) -> None:
+                 inplace: bool = False) -> None:
         super().__init__()
         assert num_classes > 0, "Please provide a valid positive value for the num_classes."
         assert mixup_alpha > 0 or cutmix_alpha > 0, "Both alpha params can't be zero."
@@ -1989,16 +1987,8 @@ def __init__(self, num_classes: int,
         self.mixup_alpha = mixup_alpha
         self.cutmix_p = cutmix_p
         self.cutmix_alpha = cutmix_alpha
-        self.label_smoothing = label_smoothing
         self.inplace = inplace
 
-    def _smooth_one_hot(self, target: Tensor) -> Tensor:
-        N = target.shape[0]
-        device = target.device
-        v = torch.full(size=(N, 1), fill_value=1 - self.label_smoothing, device=device)
-        return torch.full(size=(N, self.num_classes), fill_value=self.label_smoothing / self.num_classes,
-                          device=device).scatter_add_(1, target.unsqueeze(1), v)
-
     def forward(self, batch: Tensor, target: Tensor) -> Tuple[Tensor, Tensor]:
         """
         Args:
@@ -2014,21 +2004,18 @@ def forward(self, batch: Tensor, target: Tensor) -> Tuple[Tensor, Tensor]:
             raise ValueError("Target ndim should be 1. Got {}".format(target.ndim))
         elif target.dtype != torch.int64:
             raise ValueError("Target dtype should be torch.int64. Got {}".format(target.dtype))
-        elif batch.size(0) % 2 != 0:
-            # speed optimization, see below
-            raise ValueError("The batch size should be even.")
 
         if not self.inplace:
             batch = batch.clone()
             # target = target.clone()
 
-        target = self._smooth_one_hot(target)
+        target = torch.nn.functional.one_hot(target, num_classes=self.num_classes).to(dtype=torch.float32)
         if torch.rand(1).item() >= self.p:
             return batch, target
 
-        # It's faster to flip the batch instead of shuffling it to create image pairs
-        batch_flipped = batch.flip(0)
-        target_flipped = target.flip(0)
+        # It's faster to roll the batch by one instead of shuffling it to create image pairs
+        batch_flipped = batch.roll(1)
+        target_flipped = target.roll(1)
 
         if self.mixup_alpha <= 0.0:
             use_mixup = False
@@ -2072,7 +2059,6 @@ def __repr__(self) -> str:
         s += ', mixup_alpha={mixup_alpha}'
         s += ', cutmix_p={cutmix_p}'
         s += ', cutmix_alpha={cutmix_alpha}'
-        s += ', label_smoothing={label_smoothing}'
         s += ', inplace={inplace}'
         s += ')'
         return s.format(**self.__dict__)
```
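Why roll rather than flip, and why the even-batch-size check could be dropped: `flip(0)` reverses the batch, so the middle sample of an odd-sized batch would be mixed with itself, whereas rolling by one position gives every sample a distinct partner at any batch size. A small illustration, not part of the commit, using a 1-D tensor where `roll(1)` coincides with `roll(1, 0)`; for an N-D batch, pairing samples would need an explicit dimension (`roll(1, 0)`), since `torch.roll` without one operates on the flattened tensor.

```python
import torch

batch_ids = torch.tensor([0, 1, 2, 3, 4])  # an odd-sized batch

# flip(0) reverses the batch: sample 2 is paired with itself,
# which is why the old implementation rejected odd batch sizes.
print(batch_ids.flip(0))   # tensor([4, 3, 2, 1, 0])

# Rolling by one pairs each sample with its neighbour instead,
# so no sample meets itself and any batch size works.
print(batch_ids.roll(1))   # tensor([4, 0, 1, 2, 3])
```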

0 commit comments
