added functionality to save weights,

caffeine-coder1 · caffeine-coder1 · commit 8eff864240f1 · 2021-06-18T13:18:50.000+05:30
based on the loss.
 removed the reshape function, as the output of the model is
 already as per the requirement.
diff --git a/GAN/DCGAN/training.py b/GAN/DCGAN/training.py
@@ -6,112 +6,132 @@
 from torch.utils.data import DataLoader
 from model import Discriminator, Faker
 from torch.utils.tensorboard import SummaryWriter
+from pathlib import Path
 
 
-# ~~~~~~~~~~~~~~~~~~~ hyper parameters ~~~~~~~~~~~~~~~~~~~ #
-EPOCHS = 20
-CHANNELS = 1
-H, W = 64, 64
-IMG_SIZE = CHANNELS * H * W
-lr = 2e-4
-work_device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
-FEATURE_D = 128
-Z_DIM = 100
-GEN_TRAIN_STEPS = 5
-BATCH_SIZE = 128
-# ~~~~~~~~~~~~~~~~~~~ loading the dataset ~~~~~~~~~~~~~~~~~~~ #
+if __name__ == "__main__":
 
-trans = transforms.Compose(
-    [transforms.Resize((H, W)), transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])
+    # ~~~~~~~~~~~~~~~~~~~ hyper parameters ~~~~~~~~~~~~~~~~~~~ #
+    EPOCHS = 20
+    CHANNELS = 1
+    H, W = 64, 64
+    IMG_SIZE = CHANNELS * H * W
+    lr = 2e-4
+    work_device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+    FEATURE_D = 128
+    Z_DIM = 100
+    GEN_TRAIN_STEPS = 5
+    BATCH_SIZE = 128
+    Weight_dir = Path('/weights').resolve()
+    if not Weight_dir.exists():
+        Weight_dir.mkdir()
+    # ~~~~~~~~~~~~~~~~~~~ loading the dataset ~~~~~~~~~~~~~~~~~~~ #
 
-MNIST_data = MNIST('./data', True, transform=trans, download=True)
+    trans = transforms.Compose(
+        [transforms.Resize((H, W)), transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])
 
-loader = DataLoader(MNIST_data, BATCH_SIZE, True, num_workers=1)
+    MNIST_data = MNIST('./data', True, transform=trans, download=True)
 
-# ~~~~~~~~~~~~~~~~~~~ creating tensorboard variables ~~~~~~~~~~~~~~~~~~~ #
+    loader = DataLoader(MNIST_data, BATCH_SIZE, True, num_workers=1)
 
-writer_fake = SummaryWriter("logs/fake")
-writer_real = SummaryWriter("logs/real")
+    # ~~~~~~~~~~~~~~~~~~~ creating tensorboard variables ~~~~~~~~~~~~~~~~~~~ #
 
-# ~~~~~~~~~~~~~~~~~~~ loading the model ~~~~~~~~~~~~~~~~~~~ #
+    writer_fake = SummaryWriter("logs/fake")
+    writer_real = SummaryWriter("logs/real")
 
-disc = Discriminator(img_channels=CHANNELS,
-                     feature_d=FEATURE_D).to(work_device)
-gen = Faker(Z_DIM, CHANNELS, FEATURE_D).to(work_device)
+    # ~~~~~~~~~~~~~~~~~~~ loading the model ~~~~~~~~~~~~~~~~~~~ #
 
-# ~~~~~~~~~~~~~~~~~~~ create optimizer and loss ~~~~~~~~~~~~~~~~~~~ #
+    disc = Discriminator(img_channels=CHANNELS,
+                         feature_d=FEATURE_D).to(work_device)
+    gen = Faker(Z_DIM, CHANNELS, FEATURE_D).to(work_device)
 
-disc_optim = optim.Adam(disc.parameters(), lr, (0.5, 0.999))
-gen_optim = optim.Adam(gen.parameters(), lr, (0.5, 0.999))
-criterion = torch.nn.BCELoss()
+    # ~~~~~~~~~~~~~~~~~~~ create optimizer and loss ~~~~~~~~~~~~~~~~~~~ #
 
-# ~~~~~~~~~~~~~~~~~~~ training loop ~~~~~~~~~~~~~~~~~~~ #
+    disc_optim = optim.Adam(disc.parameters(), lr, (0.5, 0.999))
+    gen_optim = optim.Adam(gen.parameters(), lr, (0.5, 0.999))
+    criterion = torch.nn.BCELoss()
 
-for epoch in range(EPOCHS):
+    # ~~~~~~~~~~~~~~~~~~~ training loop ~~~~~~~~~~~~~~~~~~~ #
 
-    for batch_idx, (real, _) in enumerate(loader):
-        disc.train()
-        gen.train()
-        real = real.to(work_device)
-        fixed_noise = torch.rand(real.shape[0], Z_DIM, H, W).to(work_device)
-        # ~~~~~~~~~~~~~~~~~~~ discriminator loop ~~~~~~~~~~~~~~~~~~~ #
+    for epoch in range(EPOCHS):
+        D_loss_prev = inf
+        G_loss_prev = inf
 
-        fake = gen(fixed_noise)  # dim of (N,1,28,28)
-        # ~~~~~~~~~~~~~~~~~~~ forward ~~~~~~~~~~~~~~~~~~~ #
-        real_predict = disc(real).view(-1)  # make it one dimensional array
-        fake_predict = disc(fake).view(-1)  # make it one dimensional array
+        for batch_idx, (real, _) in enumerate(loader):
+            disc.train()
+            gen.train()
+            real = real.to(work_device)
+            fixed_noise = torch.rand(
+                real.shape[0], Z_DIM, 1, 1).to(work_device)
+            # ~~~~~~~~~~~~~~~~~~~ discriminator loop ~~~~~~~~~~~~~~~~~~~ #
 
-        labels = torch.cat([torch.ones_like(real_predict),
-                            torch.zeros_like(fake_predict)], dim=0)
-
-        # ~~~~~~~~~~~~~~~~~~~ loss ~~~~~~~~~~~~~~~~~~~ #
-        D_loss = criterion(
-            torch.cat([real_predict, fake_predict], dim=0), labels)
-
-        # ~~~~~~~~~~~~~~~~~~~ backward ~~~~~~~~~~~~~~~~~~~ #
-        disc.zero_grad()
-        D_loss.backward()
-        disc_optim.step()
-
-        # ~~~~~~~~~~~~~~~~~~~ generator loop ~~~~~~~~~~~~~~~~~~~ #
-        for _ in range(GEN_TRAIN_STEPS):
-            # ~~~~~~~~~~~~~~~~~~~ forward ~~~~~~~~~~~~~~~~~~~ #
-            fake = gen(fixed_noise).view(-1, CHANNELS,
-                                         H, W)  # dim of (N,1,32,32)
+            fake = gen(fixed_noise)  # dim of (N,1,28,28)
             # ~~~~~~~~~~~~~~~~~~~ forward ~~~~~~~~~~~~~~~~~~~ #
+            real_predict = disc(real).view(-1)  # make it one dimensional array
             fake_predict = disc(fake).view(-1)  # make it one dimensional array
+
+            labels = torch.cat([torch.ones_like(real_predict),
+                                torch.zeros_like(fake_predict)], dim=0)
+
             # ~~~~~~~~~~~~~~~~~~~ loss ~~~~~~~~~~~~~~~~~~~ #
+            D_loss = criterion(
+                torch.cat([real_predict, fake_predict], dim=0), labels)
 
-            G_loss = criterion(fake_predict, torch.ones_like(fake_predict))
             # ~~~~~~~~~~~~~~~~~~~ backward ~~~~~~~~~~~~~~~~~~~ #
-            gen.zero_grad()
-            G_loss.backward()
-            gen_optim.step()
-
-        # ~~~~~~~~~~~~~~~~~~~ loading the tensorboard ~~~~~~~~~~~~~~~~~~~ #
-
-        if batch_idx == 0:
-            print(
-                f"Epoch [{epoch}/{EPOCHS}] Batch {batch_idx}/{len(loader)} \
-                            Loss D: {D_loss:.4f}, loss G: {G_loss:.4f}"
-            )
-
-            with torch.no_grad():
-                disc.eval()
-                gen.eval()
-                fake = gen(fixed_noise).reshape(-1, CHANNELS, H, W)
-                data = real.reshape(-1, CHANNELS, H, W)
-                if BATCH_SIZE > 32:
-                    fake = fake[:32]
-                    data = data[:32]
-                img_grid_fake = torchvision.utils.make_grid(
-                    fake, normalize=True)
-                img_grid_real = torchvision.utils.make_grid(
-                    data, normalize=True)
-
-                writer_fake.add_image(
-                    "Mnist Fake Images", img_grid_fake, global_step=epoch
-                )
-                writer_real.add_image(
-                    "Mnist Real Images", img_grid_real, global_step=epoch
+            disc.zero_grad()
+            D_loss.backward()
+            disc_optim.step()
+
+            # ~~~~~~~~~~~~~~~~~~~ generator loop ~~~~~~~~~~~~~~~~~~~ #
+            for _ in range(GEN_TRAIN_STEPS):
+                # ~~~~~~~~~~~~~~~~~~~ forward ~~~~~~~~~~~~~~~~~~~ #
+                fake = gen(fixed_noise)
+                # ~~~~~~~~~~~~~~~~~~~ forward ~~~~~~~~~~~~~~~~~~~ #
+                # make it one dimensional array
+                fake_predict = disc(fake).view(-1)
+                # ~~~~~~~~~~~~~~~~~~~ loss ~~~~~~~~~~~~~~~~~~~ #
+
+                G_loss = criterion(fake_predict, torch.ones_like(fake_predict))
+                # ~~~~~~~~~~~~~~~~~~~ backward ~~~~~~~~~~~~~~~~~~~ #
+                gen.zero_grad()
+                G_loss.backward()
+                gen_optim.step()
+
+            # ~~~~~~~~~~~~~~~~~~~ loading the tensorboard ~~~~~~~~~~~~~~~~~~~ #
+
+            if batch_idx == 0:
+                print(
+                    f"Epoch [{epoch}/{EPOCHS}] Batch {batch_idx}/{len(loader)} \
+                                Loss D: {D_loss:.4f}, loss G: {G_loss:.4f}"
                 )
+
+                with torch.no_grad():
+                    disc.eval()
+                    gen.eval()
+                    fake = gen(fixed_noise).reshape(-1, CHANNELS, H, W)
+                    data = real.reshape(-1, CHANNELS, H, W)
+                    if BATCH_SIZE > 32:
+                        fake = fake[:32]
+                        data = data[:32]
+                    img_grid_fake = torchvision.utils.make_grid(
+                        fake, normalize=True)
+                    img_grid_real = torchvision.utils.make_grid(
+                        data, normalize=True)
+
+                    writer_fake.add_image(
+                        "Mnist Fake Images", img_grid_fake, global_step=epoch
+                    )
+                    writer_real.add_image(
+                        "Mnist Real Images", img_grid_real, global_step=epoch
+                    )
+
+        # ~~~~~~~~~~~~~~~~~~~ saving the weights ~~~~~~~~~~~~~~~~~~~ #
+        if D_loss_prev > D_loss:
+            D_loss_prev = D_loss
+            weight_path = str(Weight_dir/'dirscriminator.pth')
+            torch.save(disc.state_dict(), weight_path)
+
+        if G_loss_prev > G_loss:
+            G_loss_prev = G_loss
+            weight_path = str(Weight_dir/'generator.pth')
+            torch.save(gen.state_dict(), weight_path)