Add style components from StyleGAN2

* styled convolution with modulation and demodulation
* pixel norm
* linear and conv layers with equalized learning rate
parent 4706a902f6
commit a697845933
map2map/models/style.py (new file, 163 lines)
@@ -0,0 +1,163 @@
import math
import torch
import torch.nn as nn
import torch.nn.functional as F


class PixelNorm(nn.Module):
    """Pixelwise normalization after conv layers.

    See ProGAN, StyleGAN.
    """
    def __init__(self):
        super().__init__()

    def forward(self, x, eps=1e-8):
        return x * torch.rsqrt(x.pow(2).mean(dim=1, keepdim=True) + eps)
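
# Usage sketch (illustration only, not part of the original commit).
# PixelNorm rescales each spatial location's channel vector to unit RMS,
# independent of batch statistics:
#
#   >>> norm = PixelNorm()
#   >>> x = torch.randn(4, 16, 8, 8, 8)  # N, C, D, H, W
#   >>> y = norm(x)  # per-voxel channel vectors now have ~unit RMS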


class LinearElr(nn.Module):
    """Linear layer with equalized learning rate.

    See ProGAN, StyleGAN, and arXiv:1706.05350.

    Is this useful at all, other than for the regularization effect
    (arXiv:1706.05350)?
    """
    def __init__(self, in_size, out_size, bias=True, act=None):
        super().__init__()

        self.weight = nn.Parameter(torch.randn(out_size, in_size))
        self.wnorm = 1 / math.sqrt(in_size)

        if bias:
            self.bias = nn.Parameter(torch.zeros(out_size))
        else:
            self.register_parameter('bias', None)

        self.act = act

    def forward(self, x):
        x = F.linear(x, self.weight * self.wnorm, bias=self.bias)

        if self.act:
            x = F.leaky_relu(x, negative_slope=0.2)

        return x
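
# Sketch of the equalized-LR idea (illustration only): weights are stored
# with unit variance and rescaled by 1 / sqrt(fan_in) on every forward pass,
# so all layers see comparable effective gradient scales:
#
#   >>> fc = LinearElr(512, 256, act=True)  # any truthy act enables leaky ReLU
#   >>> w = torch.randn(8, 512)  # e.g. a batch of latent vectors
#   >>> y = fc(w)                # shape (8, 256)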


class ConvElr3d(nn.Module):
    """Conv3d layer with equalized learning rate.

    See ProGAN, StyleGAN, and arXiv:1706.05350.

    Is this useful at all, other than for the regularization effect
    (arXiv:1706.05350)?
    """
    def __init__(self, in_chan, out_chan, kernel_size,
                 stride=1, padding=0, bias=True):
        super().__init__()

        self.weight = nn.Parameter(
            torch.randn(out_chan, in_chan, *(kernel_size,) * 3),
        )
        fan_in = in_chan * kernel_size ** 3
        self.wnorm = 1 / math.sqrt(fan_in)

        if bias:
            self.bias = nn.Parameter(torch.zeros(out_chan))
        else:
            self.register_parameter('bias', None)

        self.stride = stride
        self.padding = padding

    def forward(self, x):
        x = F.conv3d(
            x,
            self.weight * self.wnorm,
            bias=self.bias,
            stride=self.stride,
            padding=self.padding,
        )

        return x
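
# Illustrative check (not in the original commit): the runtime weight scale
# uses fan_in = in_chan * kernel_size**3, matching Conv3d's He init scale:
#
#   >>> conv = ConvElr3d(16, 32, 3, padding=1)
#   >>> x = torch.randn(2, 16, 8, 8, 8)  # N, C, D, H, W
#   >>> y = conv(x)                      # shape (2, 32, 8, 8, 8)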


class ConvMod3d(nn.Module):
    """Convolution layer with modulation and demodulation, from StyleGAN2.

    Weight and bias initialization from `torch.nn._ConvNd.reset_parameters()`.
    """
    def __init__(self, style_size, in_chan, out_chan, kernel_size=3, stride=1,
                 bias=True, resample=None):
        super().__init__()

        self.style_weight = nn.Parameter(torch.empty(in_chan, style_size))
        nn.init.kaiming_uniform_(self.style_weight, a=math.sqrt(5),
                                 mode='fan_in', nonlinearity='leaky_relu')
        self.style_bias = nn.Parameter(torch.ones(in_chan))  # NOTE: init to 1

        if resample is None:
            K3 = (kernel_size,) * 3
            self.weight = nn.Parameter(torch.empty(out_chan, in_chan, *K3))
            self.stride = stride
            self.conv = F.conv3d
        elif resample == 'U':
            K3 = (2,) * 3
            # NOTE: not clear to me why conv_transpose has channels swapped
            self.weight = nn.Parameter(torch.empty(in_chan, out_chan, *K3))
            self.stride = 2
            self.conv = F.conv_transpose3d
        elif resample == 'D':
            K3 = (2,) * 3
            self.weight = nn.Parameter(torch.empty(out_chan, in_chan, *K3))
            self.stride = 2
            self.conv = F.conv3d
        else:
            raise ValueError('resample type {} not supported'.format(resample))
        self.resample = resample

        nn.init.kaiming_uniform_(
            self.weight, a=math.sqrt(5),
            mode='fan_in',  # effectively 'fan_out' for 'D'
            nonlinearity='leaky_relu',
        )

        if bias:
            self.bias = nn.Parameter(torch.zeros(out_chan))
            fan_in, _ = nn.init._calculate_fan_in_and_fan_out(self.weight)
            bound = 1 / math.sqrt(fan_in)
            nn.init.uniform_(self.bias, -bound, bound)
        else:
            self.register_parameter('bias', None)

    def forward(self, x, s, eps=1e-8):
        N, Cin, *DHWin = x.shape
        C0, C1, *K3 = self.weight.shape
        if self.resample == 'U':
            Cin, Cout = C0, C1
        else:
            Cout, Cin = C0, C1

        s = F.linear(s, self.style_weight, bias=self.style_bias)

        # modulation
        if self.resample == 'U':
            s = s.reshape(N, Cin, 1, 1, 1, 1)
        else:
            s = s.reshape(N, 1, Cin, 1, 1, 1)
        w = self.weight * s

        # demodulation
        if self.resample == 'U':
            fan_in_dim = (1, 3, 4, 5)
        else:
            fan_in_dim = (2, 3, 4, 5)
        w = w * torch.rsqrt(w.pow(2).sum(dim=fan_in_dim, keepdim=True) + eps)

        # batch the samples into the group dimension of one grouped conv
        w = w.reshape(N * C0, C1, *K3)
        x = x.reshape(1, N * Cin, *DHWin)
        x = self.conv(x, w, stride=self.stride, groups=N)
        _, _, *DHWout = x.shape
        x = x.reshape(N, Cout, *DHWout)

        # add bias after ungrouping; the grouped conv itself would expect
        # N * Cout bias entries, while self.bias only has Cout
        if self.bias is not None:
            x = x + self.bias.reshape(-1, 1, 1, 1)

        return x
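
# Usage sketch (illustration only, parameter values are made up). Each
# sample's style vector modulates the shared conv weights, and demodulation
# rescales them back to ~unit fan-in norm:
#
#   >>> conv = ConvMod3d(style_size=128, in_chan=16, out_chan=32)
#   >>> x = torch.randn(2, 16, 8, 8, 8)  # N, C, D, H, W
#   >>> s = torch.randn(2, 128)          # per-sample style vectors
#   >>> y = conv(x, s)                   # shape (2, 32, 6, 6, 6), no padding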