Merge pull request #12 from spencerwooo/decowa

spencerwooo · Sep 18, 2024 · 28e5a72 · 28e5a72
2 parents a0703f3 + 4a30516
commit 28e5a72
Show file tree

Hide file tree

Showing 3 changed files with 267 additions and 1 deletion.
diff --git a/README.md b/README.md
@@ -57,6 +57,7 @@ Gradient-based attacks:
 |     FIA      | $\ell_\infty$ | [Feature Importance-aware Transferable Adversarial Attacks](https://arxiv.org/abs/2107.14185)                                  | `torchattack.FIA`         |
 | PNA-PatchOut | $\ell_\infty$ | [Towards Transferable Adversarial Attacks on Vision Transformers](https://arxiv.org/abs/2109.04176)                            | `torchattack.PNAPatchOut` |
 |     TGR      | $\ell_\infty$ | [Transferable Adversarial Attacks on Vision Transformers with Token Gradient Regularization](https://arxiv.org/abs/2303.15754) | `torchattack.TGR`         |
+|    DeCoWA    | $\ell_\infty$ | [Boosting Adversarial Transferability across Model Genus by Deformation-Constrained Warping](https://arxiv.org/abs/2402.03951) | `torchattack.DeCoWA`      |
 
 Others:
 

diff --git a/src/torchattack/__init__.py b/src/torchattack/__init__.py
@@ -1,4 +1,5 @@
 from torchattack.admix import Admix
+from torchattack.decowa import DeCoWA
 from torchattack.deepfool import DeepFool
 from torchattack.difgsm import DIFGSM
 from torchattack.fgsm import FGSM
@@ -10,14 +11,17 @@
 from torchattack.pgdl2 import PGDL2
 from torchattack.pna_patchout import PNAPatchOut
 from torchattack.sinifgsm import SINIFGSM
+from torchattack.ssp import SSP
+from torchattack.tgr import TGR
 from torchattack.tifgsm import TIFGSM
 from torchattack.vmifgsm import VMIFGSM
 from torchattack.vnifgsm import VNIFGSM
 
-__version__ = '0.6.0'
+__version__ = '0.7.0'
 
 __all__ = [
     'Admix',
+    'DeCoWA',
     'DeepFool',
     'DIFGSM',
     'FIA',
@@ -29,6 +33,8 @@
     'PGDL2',
     'PNAPatchOut',
     'SINIFGSM',
+    'SSP',
+    'TGR',
     'TIFGSM',
     'VMIFGSM',
     'VNIFGSM',

diff --git a/src/torchattack/decowa.py b/src/torchattack/decowa.py
@@ -0,0 +1,259 @@
+from typing import Callable
+
+import torch
+import torch.nn as nn
+
+from torchattack.base import Attack
+
+
+class DeCoWA(Attack):
+    """The DeCoWA (Deformation-Constrained Warping Attack) attack.
+
+    From the paper 'Boosting Adversarial Transferability across Model Genus by
+    Deformation-Constrained Warping',
+    https://arxiv.org/abs/2402.03951
+
+    Args:
+        model: The model to attack.
+        normalize: A transform to normalize images.
+        device: Device to use for tensors. Defaults to cuda if available.
+        eps: The maximum perturbation. Defaults to 8/255.
+        steps: Number of steps. Defaults to 10.
+        alpha: Step size, `eps / steps` if None. Defaults to None.
+        decay: Decay factor for the momentum term. Defaults to 1.0.
+        mesh_width: Width of the control points. Defaults to 3.
+        mesh_height: Height of the control points. Defaults to 3.
+        rho: Regularization parameter for deformation. Defaults to 0.01.
+        num_warping: Number of warping transformation samples. Defaults to 20.
+        noise_scale: Scale of the random noise. Defaults to 2.
+        clip_min: Minimum value for clipping. Defaults to 0.0.
+        clip_max: Maximum value for clipping. Defaults to 1.0.
+        targeted: Targeted attack if True. Defaults to False.
+    """
+
+    def __init__(
+        self,
+        model: nn.Module,
+        normalize: Callable[[torch.Tensor], torch.Tensor] | None,
+        device: torch.device | None = None,
+        eps: float = 8 / 255,
+        steps: int = 10,
+        alpha: float | None = None,
+        decay: float = 1.0,
+        mesh_width: int = 3,
+        mesh_height: int = 3,
+        rho: float = 0.01,
+        num_warping: int = 20,
+        noise_scale: int = 2,
+        clip_min: float = 0.0,
+        clip_max: float = 1.0,
+        targeted: bool = False,
+    ):
+        super().__init__(normalize, device)
+
+        self.model = model
+        self.eps = eps
+        self.steps = steps
+        self.alpha = alpha
+        self.decay = decay
+        self.mesh_width = mesh_width
+        self.mesh_height = mesh_height
+        self.rho = rho
+        self.num_warping = num_warping
+        self.noise_scale = noise_scale
+        self.clip_min = clip_min
+        self.clip_max = clip_max
+        self.targeted = targeted
+        self.lossfn = nn.CrossEntropyLoss()
+
+    def forward(self, x: torch.Tensor, y: torch.Tensor) -> torch.Tensor:
+        """Perform MI-FGSM on a batch of images.
+
+        Args:
+            x: A batch of images. Shape: (N, C, H, W).
+            y: A batch of labels. Shape: (N).
+
+        Returns:
+            The perturbed images if successful. Shape: (N, C, H, W).
+        """
+
+        delta = torch.zeros_like(x, requires_grad=True)
+
+        # If alpha is not given, set to eps / steps
+        if self.alpha is None:
+            self.alpha = self.eps / self.steps
+
+        for _ in range(self.steps):
+            g = torch.zeros_like(x)
+
+            # Perform warping
+            for _ in range(self.num_warping):
+                # Apply warping to perturbation
+                noise_map = torch.rand([self.mesh_height - 2, self.mesh_width - 2, 2])
+                noise_map_hat = (noise_map - 0.5) * self.noise_scale
+
+                # Iterate for a round only
+                for _ in range(1):
+                    noise_map_hat.requires_grad_()
+
+                    vwt_x = self._vwt(x + delta, noise_map_hat)
+                    outs = self.model(self.normalize(vwt_x))
+                    loss = self.lossfn(outs, y)
+
+                    if self.targeted:
+                        loss = -loss
+
+                    loss.backward()
+
+                    if noise_map_hat.grad is None:
+                        continue
+
+                    noise_map_hat.detach_()
+                    noise_map_hat -= self.rho * noise_map_hat.grad
+
+                vwt_x = self._vwt(x + delta, noise_map_hat)
+
+                # Compute loss
+                outs = self.model(self.normalize(vwt_x))
+                loss = self.lossfn(outs, y)
+
+                if self.targeted:
+                    loss = -loss
+
+                # Compute gradient
+                loss.backward()
+
+                # Accumulate gradient
+                g += delta.grad
+
+            if delta.grad is None:
+                continue
+
+            # Average gradient over warping
+            g /= self.num_warping
+
+            # Apply momentum term
+            g = self.decay * g + delta.grad / torch.mean(
+                torch.abs(delta.grad), dim=(1, 2, 3), keepdim=True
+            )
+
+            # Update delta
+            delta.data = delta.data + self.alpha * g.sign()
+            delta.data = torch.clamp(delta.data, -self.eps, self.eps)
+            delta.data = torch.clamp(x + delta.data, self.clip_min, self.clip_max) - x
+
+            # Zero out gradient
+            delta.grad.detach_()
+            delta.grad.zero_()
+
+        return x + delta
+
+    def _vwt(self, x: torch.Tensor, noise_map: torch.Tensor) -> torch.Tensor:
+        n, _, w, h = x.size()
+
+        xx = self._grid_points_2d(self.mesh_width, self.mesh_height, self.device)
+        yy = self._noisy_grid(self.mesh_width, self.mesh_height, noise_map, self.device)
+
+        tpbs = TPS(size=(h, w), device=self.device)
+        warped_grid_b = tpbs(xx[None, ...], yy[None, ...])
+        warped_grid_b = warped_grid_b.repeat(n, 1, 1, 1)
+
+        vwt_x = torch.grid_sampler_2d(
+            input=x,
+            grid=warped_grid_b,
+            interpolation_mode=0,
+            padding_mode=0,
+            align_corners=False,
+        )
+
+        return vwt_x
+
+    def _grid_points_2d(
+        self, width: int, height: int, device: torch.device
+    ) -> torch.Tensor:
+        x = torch.linspace(-1, 1, width, device=device)
+        y = torch.linspace(-1, 1, height, device=device)
+
+        grid_x, grid_y = torch.meshgrid(x, y)
+        grid = torch.stack((grid_y, grid_x), dim=-1)
+
+        return grid.view(-1, 2)
+
+    def _noisy_grid(
+        self, width: int, height: int, noise_map: torch.Tensor, device: torch.device
+    ) -> torch.Tensor:
+        grid = self._grid_points_2d(width, height, device)
+        mod = torch.zeros([height, width, 2], device=device)
+        mod[1 : height - 1, 1 : width - 1, :] = noise_map
+        return grid + mod.reshape(-1, 2)
+
+
+def k_matrix(x: torch.Tensor, y: torch.Tensor) -> torch.Tensor:
+    eps = 1e-9
+    d2 = torch.pow(x[:, :, None, :] - y[:, None, :, :], 2).sum(-1)
+    k_mat = d2 * torch.log(d2 + eps)
+    return k_mat
+
+
+def p_matrix(x: torch.Tensor) -> torch.Tensor:
+    n, k = x.shape[:2]
+    p_mat = torch.ones(n, k, 3, device=x.device)
+    p_mat[:, :, 1:] = x
+    return p_mat
+
+
+class TPSCoeffs(nn.Module):
+    def __init__(self):
+        super().__init__()
+
+    def forward(
+        self, x: torch.Tensor, y: torch.Tensor
+    ) -> tuple[torch.Tensor, torch.Tensor]:
+        n, k = x.shape[:2]
+        z_mat = torch.zeros(1, k + 3, 2, device=x.device)
+        p_mat = torch.ones(n, k, 3, device=x.device)
+        l_mat = torch.zeros(n, k + 3, k + 3, device=x.device)
+        k_mat = k_matrix(x, x)
+
+        p_mat[:, :, 1:] = x
+        z_mat[:, :k, :] = y
+        l_mat[:, :k, :k] = k_mat
+        l_mat[:, :k, k:] = p_mat
+        l_mat[:, k:, :k] = p_mat.permute(0, 2, 1)
+
+        q_mat = torch.linalg.solve(l_mat, z_mat)
+        return q_mat[:, :k], q_mat[:, k:]
+
+
+class TPS(nn.Module):
+    def __init__(self, size: tuple = (256, 256), device: torch.device | None = None):
+        super().__init__()
+        h, w = size
+        self.size = size
+        self.device = device
+
+        self.tps = TPSCoeffs()
+
+        grid = torch.ones(1, h, w, 2, device=device)
+        grid[:, :, :, 0] = torch.linspace(-1, 1, w, device=device)
+        grid[:, :, :, 1] = torch.linspace(-1, 1, h, device=device)[..., None]
+        self.grid = grid.view(-1, h * w, 2)
+
+    def forward(self, x: torch.Tensor, y: torch.Tensor) -> torch.Tensor:
+        h, w = self.size
+        w_mat, a_mat = self.tps(x, y)
+        u_mat = k_matrix(self.grid, x)
+        p_mat = p_matrix(self.grid)
+        grid = p_mat @ a_mat + u_mat @ w_mat
+        return grid.view(-1, h, w, 2)
+
+
+if __name__ == '__main__':
+    from torchattack.eval import run_attack
+
+    run_attack(
+        attack=DeCoWA,
+        attack_cfg={'eps': 16 / 255, 'steps': 10},
+        model_name='resnet50',
+        victim_model_names=['resnet18', 'vit_b_16'],
+    )