-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathdcgan_commented.py
144 lines (116 loc) · 9.78 KB
/
dcgan_commented.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
# Deep Convolutional GANs
# Importing the libraries
from __future__ import print_function
import torch
import torch.nn as nn
import torch.nn.parallel
import torch.optim as optim
import torch.utils.data
import torchvision.datasets as dset
import torchvision.transforms as transforms
import torchvision.utils as vutils
from torch.autograd import Variable
# Setting some hyperparameters
batchSize = 64 # We set the size of the batch.
imageSize = 64 # We set the size of the generated images (64x64).
# Creating the transformations
transform = transforms.Compose([transforms.Scale(imageSize), transforms.ToTensor(), transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)),]) # We create a list of transformations (scaling, tensor conversion, normalization) to apply to the input images.
# Loading the dataset
dataset = dset.CIFAR10(root = './data', download = True, transform = transform) # We download the training set in the ./data folder and we apply the previous transformations on each image.
dataloader = torch.utils.data.DataLoader(dataset, batch_size = batchSize, shuffle = True, num_workers = 2) # We use dataLoader to get the images of the training set batch by batch.
# Defining the weights_init function that takes as input a neural network m and that will initialize all its weights.
def weights_init(m):
classname = m.__class__.__name__
if classname.find('Conv') != -1:
m.weight.data.normal_(0.0, 0.02)
elif classname.find('BatchNorm') != -1:
m.weight.data.normal_(1.0, 0.02)
m.bias.data.fill_(0)
# Defining the generator
class G(nn.Module): # We introduce a class to define the generator.
def __init__(self): # We introduce the __init__() function that will define the architecture of the generator.
super(G, self).__init__() # We inherit from the nn.Module tools.
self.main = nn.Sequential( # We create a meta module of a neural network that will contain a sequence of modules (convolutions, full connections, etc.).
nn.ConvTranspose2d(100, 512, 4, 1, 0, bias = False), # We start with an inversed convolution.
nn.BatchNorm2d(512), # We normalize all the features along the dimension of the batch.
nn.ReLU(True), # We apply a ReLU rectification to break the linearity.
nn.ConvTranspose2d(512, 256, 4, 2, 1, bias = False), # We add another inversed convolution.
nn.BatchNorm2d(256), # We normalize again.
nn.ReLU(True), # We apply another ReLU.
nn.ConvTranspose2d(256, 128, 4, 2, 1, bias = False), # We add another inversed convolution.
nn.BatchNorm2d(128), # We normalize again.
nn.ReLU(True), # We apply another ReLU.
nn.ConvTranspose2d(128, 64, 4, 2, 1, bias = False), # We add another inversed convolution.
nn.BatchNorm2d(64), # We normalize again.
nn.ReLU(True), # We apply another ReLU.
nn.ConvTranspose2d(64, 3, 4, 2, 1, bias = False), # We add another inversed convolution.
nn.Tanh() # We apply a Tanh rectification to break the linearity and stay between -1 and +1.
)
def forward(self, input): # We define the forward function that takes as argument an input that will be fed to the neural network, and that will return the output containing the generated images.
output = self.main(input) # We forward propagate the signal through the whole neural network of the generator defined by self.main.
return output # We return the output containing the generated images.
# Creating the generator
netG = G() # We create the generator object.
netG.apply(weights_init) # We initialize all the weights of its neural network.
# Defining the discriminator
class D(nn.Module): # We introduce a class to define the discriminator.
def __init__(self): # We introduce the __init__() function that will define the architecture of the discriminator.
super(D, self).__init__() # We inherit from the nn.Module tools.
self.main = nn.Sequential( # We create a meta module of a neural network that will contain a sequence of modules (convolutions, full connections, etc.).
nn.Conv2d(3, 64, 4, 2, 1, bias = False), # We start with a convolution.
nn.LeakyReLU(0.2, inplace = True), # We apply a LeakyReLU.
nn.Conv2d(64, 128, 4, 2, 1, bias = False), # We add another convolution.
nn.BatchNorm2d(128), # We normalize all the features along the dimension of the batch.
nn.LeakyReLU(0.2, inplace = True), # We apply another LeakyReLU.
nn.Conv2d(128, 256, 4, 2, 1, bias = False), # We add another convolution.
nn.BatchNorm2d(256), # We normalize again.
nn.LeakyReLU(0.2, inplace = True), # We apply another LeakyReLU.
nn.Conv2d(256, 512, 4, 2, 1, bias = False), # We add another convolution.
nn.BatchNorm2d(512), # We normalize again.
nn.LeakyReLU(0.2, inplace = True), # We apply another LeakyReLU.
nn.Conv2d(512, 1, 4, 1, 0, bias = False), # We add another convolution.
nn.Sigmoid() # We apply a Sigmoid rectification to break the linearity and stay between 0 and 1.
)
def forward(self, input): # We define the forward function that takes as argument an input that will be fed to the neural network, and that will return the output which will be a value between 0 and 1.
output = self.main(input) # We forward propagate the signal through the whole neural network of the discriminator defined by self.main.
return output.view(-1) # We return the output which will be a value between 0 and 1.
# Creating the discriminator
netD = D() # We create the discriminator object.
netD.apply(weights_init) # We initialize all the weights of its neural network.
# Training the DCGANs
criterion = nn.BCELoss() # We create a criterion object that will measure the error between the prediction and the target.
optimizerD = optim.Adam(netD.parameters(), lr = 0.0002, betas = (0.5, 0.999)) # We create the optimizer object of the discriminator.
optimizerG = optim.Adam(netG.parameters(), lr = 0.0002, betas = (0.5, 0.999)) # We create the optimizer object of the generator.
for epoch in range(25): # We iterate over 25 epochs.
for i, data in enumerate(dataloader, 0): # We iterate over the images of the dataset.
# 1st Step: Updating the weights of the neural network of the discriminator
netD.zero_grad() # We initialize to 0 the gradients of the discriminator with respect to the weights.
# Training the discriminator with a real image of the dataset
real, _ = data # We get a real image of the dataset which will be used to train the discriminator.
input = Variable(real) # We wrap it in a variable.
target = Variable(torch.ones(input.size()[0])) # We get the target.
output = netD(input) # We forward propagate this real image into the neural network of the discriminator to get the prediction (a value between 0 and 1).
errD_real = criterion(output, target) # We compute the loss between the predictions (output) and the target (equal to 1).
# Training the discriminator with a fake image generated by the generator
noise = Variable(torch.randn(input.size()[0], 100, 1, 1)) # We make a random input vector (noise) of the generator.
fake = netG(noise) # We forward propagate this random input vector into the neural network of the generator to get some fake generated images.
target = Variable(torch.zeros(input.size()[0])) # We get the target.
output = netD(fake.detach()) # We forward propagate the fake generated images into the neural network of the discriminator to get the prediction (a value between 0 and 1).
errD_fake = criterion(output, target) # We compute the loss between the prediction (output) and the target (equal to 0).
# Backpropagating the total error
errD = errD_real + errD_fake # We compute the total error of the discriminator.
errD.backward() # We backpropagate the loss error by computing the gradients of the total error with respect to the weights of the discriminator.
optimizerD.step() # We apply the optimizer to update the weights according to how much they are responsible for the loss error of the discriminator.
# 2nd Step: Updating the weights of the neural network of the generator
netG.zero_grad() # We initialize to 0 the gradients of the generator with respect to the weights.
target = Variable(torch.ones(input.size()[0])) # We get the target.
output = netD(fake) # We forward propagate the fake generated images into the neural network of the discriminator to get the prediction (a value between 0 and 1).
errG = criterion(output, target) # We compute the loss between the prediction (output between 0 and 1) and the target (equal to 1).
errG.backward() # We backpropagate the loss error by computing the gradients of the total error with respect to the weights of the generator.
optimizerG.step() # We apply the optimizer to update the weights according to how much they are responsible for the loss error of the generator.
# 3rd Step: Printing the losses and saving the real images and the generated images of the minibatch every 100 steps
print('[%d/%d][%d/%d] Loss_D: %.4f Loss_G: %.4f' % (epoch, 25, i, len(dataloader), errD.data[0], errG.data[0])) # We print les losses of the discriminator (Loss_D) and the generator (Loss_G).
if i % 100 == 0: # Every 100 steps:
vutils.save_image(real, '%s/real_samples.png' % "./results", normalize = True) # We save the real images of the minibatch.
fake = netG(noise) # We get our fake generated images.
vutils.save_image(fake.data, '%s/fake_samples_epoch_%03d.png' % ("./results", epoch), normalize = True) # We also save the fake generated images of the minibatch.