Skip to content

Commit 8dd7a99

Browse files
Rewrote model classes for simplicity
1 parent ef9b7d5 commit 8dd7a99

1 file changed

Lines changed: 66 additions & 59 deletions

File tree

models.py

Lines changed: 66 additions & 59 deletions
Original file line numberDiff line numberDiff line change
@@ -4,34 +4,33 @@
44

55

66
class UnetBlock(nn.Module):
    """One encoder/decoder stage of a recursively nested U-Net.

    The block wraps ``submodule`` between a downsampling 4x4 stride-2 conv
    (encoder side) and an upsampling 4x4 stride-2 transposed conv (decoder
    side). ``nf`` is the channel count produced by the up path, ``ni`` the
    channel count produced by the down conv. ``input_channels`` defaults to
    ``nf`` when not given. ``innermost`` builds the bottleneck (no submodule);
    ``outermost`` builds the top stage (no input activation, Tanh output).
    """

    def __init__(self, nf, ni, submodule=None, input_channels=None, dropout=False, innermost=False, outermost=False):
        super().__init__()
        self.outermost = outermost
        in_ch = nf if input_channels is None else input_channels

        # Encoder conv is shared by all three variants; created first so the
        # parameter-init RNG order matches the reference implementation.
        encode = nn.Conv2d(in_ch, ni, kernel_size=4, stride=2, padding=1, bias=False)

        if outermost:
            # Top stage: raw conv in, Tanh out, transposed conv keeps a bias.
            decode = nn.ConvTranspose2d(ni * 2, nf, kernel_size=4, stride=2, padding=1)
            layers = [encode, submodule, nn.ReLU(True), decode, nn.Tanh()]
        elif innermost:
            # Bottleneck: no submodule, no norm on the encoder side.
            decode = nn.ConvTranspose2d(ni, nf, kernel_size=4, stride=2, padding=1, bias=False)
            layers = [nn.LeakyReLU(0.2, True), encode, nn.ReLU(True), decode, nn.BatchNorm2d(nf)]
        else:
            # Intermediate stage: LeakyReLU/conv/norm down, ReLU/deconv/norm up.
            decode = nn.ConvTranspose2d(ni * 2, nf, kernel_size=4, stride=2, padding=1, bias=False)
            layers = [nn.LeakyReLU(0.2, True), encode, nn.BatchNorm2d(ni),
                      submodule,
                      nn.ReLU(True), decode, nn.BatchNorm2d(nf)]
            if dropout:
                layers.append(nn.Dropout(0.5))

        self.model = nn.Sequential(*layers)
3736

@@ -43,40 +42,42 @@ def forward(self, x):
4342

4443

4544
class Unet(nn.Module):
    """U-Net generator built by nesting UnetBlock stages inside-out.

    Args:
        nfg: base number of generator filters; the deepest stages use
            ``nfg * 8`` channels.
        input_channels: channels of the input image (default 1, the L channel
            of Lab color space in this colorization setup).
        output_channels: channels of the predicted image (default 2, the ab
            channels).
        n_down: total number of downsampling stages (default 8, matching the
            previously hard-coded depth: 1 innermost + ``n_down - 5`` dropout
            stages + 3 widening stages + 1 outermost).
    """

    def __init__(self, nfg=64, input_channels=1, output_channels=2, n_down=8):
        super().__init__()
        # Innermost bottleneck stage.
        block = UnetBlock(nfg * 8, nfg * 8, innermost=True)
        # Constant-width middle stages with dropout (3 when n_down == 8).
        for _ in range(n_down - 5):
            block = UnetBlock(nfg * 8, nfg * 8, submodule=block, dropout=True)
        # Three stages that halve the filter count on the way out.
        out_filters = nfg * 8
        for _ in range(3):
            block = UnetBlock(out_filters // 2, out_filters, submodule=block)
            out_filters //= 2
        # Outermost stage maps the input image in and the prediction out.
        self.model = UnetBlock(output_channels, out_filters, input_channels=input_channels,
                               submodule=block, outermost=True)

    def forward(self, x):
        return self.model(x)
5958

6059

6160
class PatchDiscriminator(nn.Module):
    """PatchGAN discriminator for 3-channel (Lab) images.

    Produces a single-channel map of patch logits: each spatial position
    classifies one receptive-field patch of the input as real or fake.

    Args:
        nfd: base number of discriminator filters.
    """

    def __init__(self, nfd=64):
        super().__init__()
        self.model = nn.Sequential(
            # First block: no normalization (standard PatchGAN convention).
            nn.Conv2d(3, nfd, 4, 2, 1, bias=True),
            nn.LeakyReLU(0.2, True),

            nn.Conv2d(nfd, nfd * 2, 4, 2, 1, bias=False),
            nn.BatchNorm2d(nfd * 2),
            nn.LeakyReLU(0.2, True),

            nn.Conv2d(nfd * 2, nfd * 4, 4, 2, 1, bias=False),
            nn.BatchNorm2d(nfd * 4),
            nn.LeakyReLU(0.2, True),

            # Stride 1 on the last hidden block: grows the receptive field
            # without shrinking the output map further.
            nn.Conv2d(nfd * 4, nfd * 8, 4, 1, 1, bias=False),
            nn.BatchNorm2d(nfd * 8),
            nn.LeakyReLU(0.2, True),

            # Head: ONE output channel of patch logits, no norm, no
            # activation. (The rewrite emitted nfd * 16 channels here — a
            # regression from the original, which reduced to 1 channel so the
            # GAN loss gets a single real/fake logit per patch.)
            nn.Conv2d(nfd * 8, 1, 4, 1, 1, bias=True),
        )

    def forward(self, x):
        return self.model(x)
@@ -111,21 +112,27 @@ def init_model(model, device):
111112

112113

113114
class MainModel(nn.Module):
    """Conditional GAN for colorization: U-Net generator vs PatchGAN discriminator."""

    def __init__(self,
                 net_generator=None,
                 lr_generator=2e-4,
                 lr_discriminator=2e-4,
                 beta1=0.5,
                 beta2=0.999,
                 lambda_l1=100.):
        super().__init__()

        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
        # Weight of the L1 reconstruction term relative to the GAN term.
        self.lambda_L1 = lambda_l1

        # Use the caller's generator when given; otherwise build the default U-Net.
        if net_generator is not None:
            self.net_G = net_generator.to(self.device)
        else:
            self.net_G = init_model(Unet(nfg=64), self.device)
        self.net_D = init_model(PatchDiscriminator(nfd=64), self.device)
        self.GAN_criterion = GANLoss(gan_mode='vanilla').to(self.device)
        self.L1_criterion = nn.L1Loss()
        self.opt_G = optim.Adam(self.net_G.parameters(), lr=lr_generator, betas=(beta1, beta2))
        self.opt_D = optim.Adam(self.net_D.parameters(), lr=lr_discriminator, betas=(beta1, beta2))
129136

130137
def set_requires_grad(self, model, requires_grad=True):
131138
for p in model.parameters():
@@ -140,19 +147,19 @@ def forward(self):
140147

141148
def backward_D(self):
    """Discriminator loss: average of the fake-rejection and real-acceptance terms."""
    # Detach the generator output so no gradient flows into the generator here.
    fake = torch.cat([self.L, self.fake_color], dim=1).detach()
    self.loss_D_fake = self.GAN_criterion(self.net_D(fake), False)
    real = torch.cat([self.L, self.ab], dim=1)
    self.loss_D_real = self.GAN_criterion(self.net_D(real), True)
    self.loss_D = 0.5 * (self.loss_D_fake + self.loss_D_real)
    self.loss_D.backward()
150157

151158
def backward_G(self):
    """Generator loss: fool the discriminator plus weighted L1 to ground truth."""
    fake = torch.cat([self.L, self.fake_color], dim=1)
    # The generator wants its output labeled real (True) by the discriminator.
    self.loss_G_GAN = self.GAN_criterion(self.net_D(fake), True)
    self.loss_G_L1 = self.L1_criterion(self.fake_color, self.ab) * self.lambda_L1
    self.loss_G = self.loss_G_GAN + self.loss_G_L1
    self.loss_G.backward()
158165

0 commit comments

Comments
 (0)