Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

GAN Models #55

Merged
merged 5 commits into from
Jul 5, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Empty file removed GAN/Algorithms/.gitkeep
Empty file.
159 changes: 159 additions & 0 deletions GAN/Algorithms/ACGAN/ACGAN.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,159 @@
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision.datasets as dsets
import torchvision.transforms as transforms
from torch.utils.data import DataLoader
import matplotlib.pyplot as plt
import numpy as np

# Device configuration
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# Hyper-parameters
image_size = 28 * 28
num_classes = 10
latent_size = 100
hidden_size = 256
num_epochs = 100
batch_size = 64
learning_rate = 0.0002

# MNIST dataset
transform = transforms.Compose([
transforms.ToTensor(),
transforms.Normalize(mean=(0.5,), std=(0.5,))
])

train_dataset = dsets.MNIST(root='../data/',
train=True,
transform=transform,
download=True)

train_loader = DataLoader(dataset=train_dataset,
batch_size=batch_size,
shuffle=True)

# Discriminator
class Discriminator(nn.Module):
def __init__(self):
super(Discriminator, self).__init__()
self.label_emb = nn.Embedding(num_classes, num_classes)

self.model = nn.Sequential(
nn.Linear(image_size + num_classes, hidden_size),
nn.LeakyReLU(0.2),
nn.Dropout(0.3),
nn.Linear(hidden_size, hidden_size),
nn.LeakyReLU(0.2),
nn.Dropout(0.3),
nn.Linear(hidden_size, 1),
nn.Sigmoid()
)

def forward(self, x, labels):
x = x.view(x.size(0), image_size)
c = self.label_emb(labels)
x = torch.cat([x, c], 1)
out = self.model(x)
return out

# Generator
class Generator(nn.Module):
def __init__(self):
super(Generator, self).__init__()
self.label_emb = nn.Embedding(num_classes, num_classes)

self.model = nn.Sequential(
nn.Linear(latent_size + num_classes, hidden_size),
nn.ReLU(),
nn.Linear(hidden_size, hidden_size),
nn.ReLU(),
nn.Linear(hidden_size, image_size),
nn.Tanh()
)

def forward(self, z, labels):
z = z.view(z.size(0), latent_size)
c = self.label_emb(labels)
x = torch.cat([z, c], 1)
out = self.model(x)
return out

# Initialize models
D = Discriminator().to(device)
G = Generator().to(device)

# Loss function and optimizer
criterion = nn.BCELoss()
d_optimizer = optim.Adam(D.parameters(), lr=learning_rate)
g_optimizer = optim.Adam(G.parameters(), lr=learning_rate)

# Utility functions
def denorm(x):
out = (x + 1) / 2
return out.clamp(0, 1)

def create_noise(batch_size, latent_size):
return torch.randn(batch_size, latent_size).to(device)

def create_labels(batch_size):
return torch.randint(0, num_classes, (batch_size,)).to(device)

# Training the ACGAN
total_step = len(train_loader)
for epoch in range(num_epochs):
for i, (images, labels) in enumerate(train_loader):
batch_size = images.size(0)
images = images.to(device)
labels = labels.to(device)

# Create the labels which are later used as input for the discriminator
real_labels = torch.ones(batch_size, 1).to(device)
fake_labels = torch.zeros(batch_size, 1).to(device)

# ================================================================== #
# Train the discriminator #
# ================================================================== #

# Compute BCELoss using real images
outputs = D(images, labels)
d_loss_real = criterion(outputs, real_labels)
real_score = outputs

# Compute BCELoss using fake images
z = create_noise(batch_size, latent_size)
fake_images = G(z, labels)
outputs = D(fake_images, labels)
d_loss_fake = criterion(outputs, fake_labels)
fake_score = outputs

# Backprop and optimize
d_loss = d_loss_real + d_loss_fake
D.zero_grad()
d_loss.backward()
d_optimizer.step()

# ================================================================== #
# Train the generator #
# ================================================================== #

# Compute loss with fake images
z = create_noise(batch_size, latent_size)
fake_images = G(z, labels)
outputs = D(fake_images, labels)

# We train G to maximize log(D(G(z)))
g_loss = criterion(outputs, real_labels)

# Backprop and optimize
G.zero_grad()
g_loss.backward()
g_optimizer.step()

if (i+1) % 200 == 0:
print(f'Epoch [{epoch}/{num_epochs}], Step [{i+1}/{total_step}], d_loss: {d_loss.item():.4f}, g_loss: {g_loss.item():.4f}, D(x): {real_score.mean().item():.2f}, D(G(z)): {fake_score.mean().item():.2f}')

# Save the trained models
torch.save(G.state_dict(), 'G_acgan.pth')
torch.save(D.state_dict(), 'D_acgan.pth')
64 changes: 64 additions & 0 deletions GAN/Algorithms/ACGAN/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,64 @@
# Auxiliary Classifier Generative Adversarial Network (ACGAN)

----

This folder contains an implementation of an Auxiliary Classifier Generative Adversarial Network (ACGAN) using PyTorch. ACGAN extends the traditional GAN architecture by incorporating class information into both the generator and discriminator, allowing control over the generated samples' characteristics.

----

## Overview

ACGANs are capable of generating high-quality images conditioned on specific classes. In addition to generating images, the discriminator in ACGAN also predicts the class labels of the generated images. This allows for more controlled and targeted image synthesis.

----

## Usage

To use this implementation, follow these steps:

1. **Clone the repository**:
```bash
git clone https://github.com/UTSAVS26/GAN-models.git
cd GAN_models/ACGAN
```

2. **Install dependencies**:
Make sure you have Python 3 and pip installed. Then install the required dependencies:
```bash
pip install -r requirements.txt
```
This will install PyTorch, torchvision, matplotlib, and numpy.

3. **Train the ACGAN**:
Run the `ACGAN.py` script to train the ACGAN model. This will train the ACGAN on the MNIST dataset and save the trained models (`G_acgan.pth` and `D_acgan.pth`).
```bash
python ACGAN.py
```

4. **Generate new images**:
After training, you can generate new images using the trained generator by running the `test_ACGAN.py` script.
```bash
python test_ACGAN.py


```
This script loads the trained generator model and generates a grid of sample images.

----

## Files

- `ACGAN.py`: Contains the implementation of the ACGAN model, training loop, and saving of trained models.
- `test_ACGAN.py`: Uses the trained generator to generate sample images after training.

## Contributing

Contributions are welcome! If you have ideas for improvements or new features, feel free to open an issue or submit a pull request.

## Author

- [Utsav Singhal](https://github.com/UTSAVS26)

---

### Happy Generating with ACGAN! 🎨
68 changes: 68 additions & 0 deletions GAN/Algorithms/ACGAN/tests/test_ACGAN.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,68 @@
import torch
import torch.nn as nn
import matplotlib.pyplot as plt
import numpy as np

# Device configuration
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# Hyper-parameters
latent_size = 100
num_classes = 10
image_size = 28 * 28

# Generator
class Generator(nn.Module):
def __init__(self):
super(Generator, self).__init__()
self.label_emb = nn.Embedding(num_classes, num_classes)

self.model = nn.Sequential(
nn.Linear(latent_size + num_classes, 256),
nn.ReLU(),
nn.Linear(256, 512),
nn.ReLU(),
nn.Linear(512, image_size),
nn.Tanh()
)

def forward(self, z, labels):
z = z.view(z.size(0), latent_size)
c = self.label_emb(labels)
x = torch.cat([z, c], 1)
out = self.model(x)
return out

# Load the trained generator model
G = Generator()
G.load_state_dict(torch.load('G_acgan.pth', map_location=torch.device('cpu')))
G.eval()

# Utility function to generate random noise
def create_noise(size, latent_dim):
return torch.randn(size, latent_dim)

# Utility function to generate labels
def create_labels(size):
return torch.randint(0, num_classes, (size,))

# Utility function to denormalize the images
def denorm(x):
out = (x + 1) / 2
return out.clamp(0, 1)

# Generate images
with torch.no_grad():
noise = create_noise(64, latent_size)
labels = create_labels(64)
fake_images = G(noise, labels)
fake_images = fake_images.reshape(fake_images.size(0), 1, 28, 28)
fake_images = denorm(fake_images)
grid = np.transpose(fake_images, (0, 2, 3, 1)).numpy()

plt.figure(figsize=(8, 8))
for i in range(grid.shape[0]):
plt.subplot(8, 8, i+1)
plt.imshow(grid[i, :, :, 0], cmap='gray')
plt.axis('off')
plt.show()
Loading