%matplotlib inline

import matplotlib.pyplot as plt
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data
from torchvision import datasets, transforms

!wget www.di.ens.fr/~lelarge/MNIST.tar.gz
!tar -zxvf MNIST.tar.gz

/usr/lib/python3.10/pty.py:89: RuntimeWarning: os.fork() was called. os.fork() is incompatible with multithreaded code, and JAX is multithreaded, so this will likely lead to a deadlock.
  pid, fd = os.forkpty()

--2024-03-25 20:22:02--  http://www.di.ens.fr/~lelarge/MNIST.tar.gz
Resolving www.di.ens.fr (www.di.ens.fr)... 129.199.99.14
Connecting to www.di.ens.fr (www.di.ens.fr)|129.199.99.14|:80... connected.
HTTP request sent, awaiting response... 302 Found
Location: https://www.di.ens.fr/~lelarge/MNIST.tar.gz [following]
--2024-03-25 20:22:03--  https://www.di.ens.fr/~lelarge/MNIST.tar.gz
Connecting to www.di.ens.fr (www.di.ens.fr)|129.199.99.14|:443... connected.
HTTP request sent, awaiting response... 200 OK
Length: unspecified [application/x-gzip]
Saving to: ‘MNIST.tar.gz’

MNIST.tar.gz            [                <=> ]  33.20M  3.78MB/s    in 11s     

2024-03-25 20:22:14 (3.10 MB/s) - ‘MNIST.tar.gz’ saved [34813078]

MNIST/
MNIST/raw/
MNIST/raw/train-labels-idx1-ubyte
MNIST/raw/t10k-labels-idx1-ubyte.gz
MNIST/raw/t10k-labels-idx1-ubyte
MNIST/raw/t10k-images-idx3-ubyte.gz
MNIST/raw/train-images-idx3-ubyte
MNIST/raw/train-labels-idx1-ubyte.gz
MNIST/raw/t10k-images-idx3-ubyte
MNIST/raw/train-images-idx3-ubyte.gz
MNIST/processed/
MNIST/processed/training.pt
MNIST/processed/test.pt

# MNIST training split rooted at the current directory; every sample is
# passed through ToTensor() when it is read from the dataset.
mnist_data = datasets.MNIST(
    root='./',
    train=True,
    download=True,
    transform=transforms.ToTensor(),
)

class Discriminator(nn.Module):
    """Fully connected network that maps each input image to one raw score.

    The input is flattened to 28*28 = 784 features per sample and passed
    through a 784 -> 300 -> 100 -> 1 stack of linear layers. The last layer
    is linear, so the returned scores are not squashed into [0, 1].
    """

    def __init__(self):
        super().__init__()
        # Leaky ReLUs (negative slope 0.2) sit between the linear layers.
        layers = [
            nn.Linear(28 * 28, 300),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Linear(300, 100),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Linear(100, 1),
        ]
        self.model = nn.Sequential(*layers)

    def forward(self, x):
        """Return a 1-D tensor holding one score per sample in ``x``."""
        batch_size = x.size(0)
        # Collapse everything except the batch dimension into one feature axis.
        flattened = x.view(batch_size, -1)
        scores = self.model(flattened)
        # Drop the trailing singleton dimension: (batch, 1) -> (batch,).
        return scores.view(batch_size)

class Generator(nn.Module):
    """Fully connected network that turns 100-dimensional vectors into images.

    A 100 -> 300 -> 784 stack of linear layers ends in a sigmoid, so every
    output value lies in [0, 1]. The 784 outputs per sample are reshaped to
    a single-channel 28x28 image.
    """

    def __init__(self):
        super().__init__()
        layers = [
            nn.Linear(100, 300),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Linear(300, 28 * 28),
            nn.Sigmoid(),
        ]
        self.model = nn.Sequential(*layers)

    def forward(self, x):
        """Return a (batch, 1, 28, 28) tensor generated from the rows of ``x``."""
        batch_size = x.size(0)
        flat_images = self.model(x)
        return flat_images.view(batch_size, 1, 28, 28)

# Discuss the answers with your tutorial group

# Discuss the answers with your tutorial group

# Discuss the answers with your tutorial group

def train(generator, discriminator, device, lr=0.001, num_epochs=5):
    """Train a GAN on MNIST by alternating discriminator and generator updates.

    For every mini-batch the discriminator is updated first, on real images
    labelled 1 and generated images labelled 0. The generator is then updated
    so that the discriminator scores its images as real (label 1). After each
    epoch the losses and mean discriminator scores of the last mini-batch are
    printed, and the images produced from a fixed set of 16 noise vectors are
    plotted.

    Args:
        generator: Module mapping a (batch, 100) noise tensor to images.
        discriminator: Module mapping a batch of images to one logit per image.
        device: ``torch.device`` on which the models and batches are placed.
        lr: Learning rate shared by both Adam optimizers.
        num_epochs: Number of passes over the MNIST training data.
    """
    latent_dim = 100  # length of each noise vector fed to the generator

    # Binary cross-entropy on raw logits (the sigmoid is folded into the loss).
    criterion = nn.BCEWithLogitsLoss()

    # Move both networks to the target device before building the optimizers.
    generator = generator.to(device)
    discriminator = discriminator.to(device)

    # From: https://colab.research.google.com/github/smartgeometry-ucl/dl4g/blob/master/gan.ipynb#scrollTo=-o7DOryPkUOb
    # GAN training can be unstable. With Adam's default beta1 of 0.9 the strong
    # gradient momentum prevents convergence here; one possible explanation is
    # that the two players of the adversarial game cannot react to each other
    # quickly enough. Lowering beta1 to 0.5 (faster decay of the gradient
    # moving average) allows quicker reactions.
    d_optimizer = torch.optim.Adam(discriminator.parameters(), lr=lr, betas=(0.5, 0.999))
    g_optimizer = torch.optim.Adam(generator.parameters(), lr=lr, betas=(0.5, 0.999))

    # Use the MNIST data as training data
    train_loader = torch.utils.data.DataLoader(mnist_data, batch_size=100, shuffle=True)

    # Fixed noise vectors, reused after every epoch so that the plotted
    # images show how the generator's output for the same inputs evolves.
    num_test_samples = 16
    test_noise = torch.randn(num_test_samples, latent_dim).to(device)

    for epoch in range(num_epochs):
        # put the generator/discriminator in training mode
        generator.train()
        discriminator.train()

        for images, _ in train_loader:
            batch_size = images.size(0)
            real_images = images.to(device)

            # === Train the Discriminator ===
            noise = torch.randn(batch_size, latent_dim).to(device)
            # Detach: the discriminator step must not backpropagate into the
            # generator, whose parameters are not updated here.
            fake_images = generator(noise).detach()
            inputs = torch.cat([real_images, fake_images])
            # Real images come first in `inputs`, so the first half of the
            # labels is 1 (real) and the second half is 0 (fake).
            labels = torch.cat([
                torch.ones(batch_size, device=device),
                torch.zeros(batch_size, device=device),
            ])

            d_outputs = discriminator(inputs)
            d_loss = criterion(d_outputs, labels)
            d_optimizer.zero_grad()
            d_loss.backward()
            d_optimizer.step()

            # === Train the Generator ===
            noise = torch.randn(batch_size, latent_dim).to(device)
            fake_images = generator(noise)
            outputs = discriminator(fake_images)

            # The generator wants its images to be classified as real, so the
            # target for every generated image is 1.
            g_loss = criterion(outputs, torch.ones(batch_size, device=device))
            g_optimizer.zero_grad()
            g_loss.backward()
            g_optimizer.step()

        # Report the average scores of the last mini-batch of the epoch
        with torch.no_grad():
            scores = torch.sigmoid(d_outputs)
            real_score = scores[:batch_size].mean().item()
            fake_score = scores[batch_size:].mean().item()

        print('Epoch [%d/%d], d_loss: %.4f, g_loss: %.4f, '
              'D(x): %.2f, D(G(z)): %.2f'
              % (epoch + 1, num_epochs, d_loss.item(), g_loss.item(), real_score, fake_score))

        # Plot images generated from the fixed noise vectors
        generator.eval()
        discriminator.eval()
        with torch.no_grad():  # plotting only; no gradients are needed
            test_images = generator(test_noise).cpu()
        plt.figure(figsize=(9, 3))
        for k in range(num_test_samples):
            plt.subplot(2, 8, k + 1)
            plt.imshow(test_images[k].numpy().reshape(28, 28), cmap='Greys')
        plt.show()

# Build one instance of each network (discriminator first, then generator).
discriminator = Discriminator()
generator = Generator()

# Run on the first CUDA device when one is available, otherwise on the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda:0")
else:
    device = torch.device("cpu")

# The training call is left disabled; uncomment it to start training.
#train(generator, discriminator, device, lr=0.0002, num_epochs=20)

# Discuss the answers with your tutorial group

# Discuss the answers with your tutorial group

Generative Adversarial Networks¶

Q1. Model¶

Part (a)¶

Part (b)¶

Part (c)¶

Q2. Training a GAN¶

Part (a)¶

Part (b)¶

Part (c)¶

Part (d)¶

Other GAN Implementations¶