# model.py

# Some code was borrowed from https://github.com/hwalsuklee/tensorflow-mnist-VAE/blob/master/vae.py

import torch
import torch.nn as nn
import torch.nn.functional as F

class Encoder(nn.Module):
    """Fully connected encoder producing the parameters of a diagonal Gaussian.

    Two hidden ReLU layers (each followed by dropout) feed a linear head whose
    output has ``2 * z_dim`` features: the first ``z_dim`` are used as the
    mean and the remaining ``z_dim`` are mapped to a positive standard
    deviation.

    Args:
        img_dim: Size of the last dimension of the input.
        hidden_dim: Width of both hidden layers.
        z_dim: Size of the latent code.
        dropout: Dropout probability applied after each hidden layer.
    """

    def __init__(self, img_dim, hidden_dim, z_dim, dropout=0.5):
        super().__init__()

        self.img_dim = img_dim
        self.hidden_dim = hidden_dim
        self.z_dim = z_dim

        self.drop = nn.Dropout(p=dropout)

        self.linear1 = nn.Linear(self.img_dim, self.hidden_dim)
        self.linear2 = nn.Linear(self.hidden_dim, self.hidden_dim)
        # The head emits mean and standard-deviation parameters side by side,
        # hence an output width of 2 * z_dim.
        self.out_layer = nn.Linear(self.hidden_dim, self.z_dim * 2)

        # He initialization for every linear layer, with zero biases.
        for m in self.modules():
            if isinstance(m, nn.Linear):
                nn.init.kaiming_normal_(m.weight)
                nn.init.constant_(m.bias, 0.0)

    def forward(self, x):
        """Encode ``x`` into ``(mu, sigma)``.

        Args:
            x: Tensor whose last dimension has size ``img_dim``; any number of
                leading dimensions is accepted.

        Returns:
            Tuple ``(mu, sigma)``; both have the leading dimensions of ``x``
            and a last dimension of size ``z_dim``. ``sigma`` is strictly
            positive.
        """
        x = F.relu(self.linear1(x))
        x = self.drop(x)

        x = F.relu(self.linear2(x))
        x = self.drop(x)

        params = self.out_layer(x)

        # nn.Linear acts on the last dimension, so the mean / standard
        # deviation split must be taken along the last axis as well. Using
        # ``...`` keeps 2-D inputs unchanged while also handling inputs with
        # fewer or more leading dimensions.
        mu = params[..., :self.z_dim]
        # The standard deviation must be positive: parametrize it with a
        # softplus and add a small epsilon for numerical stability.
        sigma = 1e-6 + F.softplus(params[..., self.z_dim:])

        return mu, sigma


class Decoder(nn.Module):
    """Fully connected decoder mapping a latent code to values in (0, 1).

    Two hidden ReLU layers, each followed by dropout, feed a final linear
    layer whose output is squashed by a sigmoid.

    Args:
        z_dim: Size of the last dimension of the latent input.
        hidden_dim: Width of both hidden layers.
        img_dim: Size of the last dimension of the output.
        dropout: Dropout probability applied after each hidden layer.
    """

    def __init__(self, z_dim, hidden_dim, img_dim, dropout=0.5):
        super().__init__()

        self.z_dim, self.hidden_dim, self.img_dim = z_dim, hidden_dim, img_dim

        self.drop = nn.Dropout(p=dropout)

        self.linear1 = nn.Linear(z_dim, hidden_dim)
        self.linear2 = nn.Linear(hidden_dim, hidden_dim)
        self.linear3 = nn.Linear(hidden_dim, img_dim)

        # He initialization with zero biases, applied layer by layer in
        # registration order.
        for layer in (self.linear1, self.linear2, self.linear3):
            nn.init.kaiming_normal_(layer.weight)
            nn.init.constant_(layer.bias, 0.0)

    def forward(self, x):
        """Decode ``x`` and return the sigmoid-activated output."""
        hidden = self.drop(F.relu(self.linear1(x)))
        hidden = self.drop(F.relu(self.linear2(hidden)))
        return torch.sigmoid(self.linear3(hidden))


# Sampling is reparametrized (z = mu + sigma * eps, eps ~ N(0, I)) so that gradients can backpropagate through it
class VAE(nn.Module):
    """Variational autoencoder built from an ``Encoder`` and a ``Decoder``.

    Args:
        img_dim: Size of the last dimension of the input and of the output.
        z_dim: Size of the latent code.
        hidden_dim: Hidden width passed to both sub-networks.
        dropout: Dropout probability passed to both sub-networks.
    """

    def __init__(self, img_dim, z_dim, hidden_dim, dropout):
        super().__init__()

        self.img_dim = img_dim
        self.z_dim = z_dim
        self.hidden_dim = hidden_dim
        self.dropout = dropout

        # Note the differing argument orders of the two constructors.
        self.encoder = Encoder(img_dim, hidden_dim, z_dim, dropout)
        self.decoder = Decoder(z_dim, hidden_dim, img_dim, dropout)

    def forward(self, x):
        """Encode ``x``, sample a latent code and decode it.

        Returns:
            Tuple ``(x_target, mu, sigma)``: the decoder output followed by
            the two encoder outputs.
        """
        mu, sigma = self.encoder(x)

        # Draw the latent code as a deterministic function of (mu, sigma)
        # plus standard normal noise, so gradients reach the encoder.
        noise = torch.randn_like(mu)
        latent = mu + sigma * noise

        reconstruction = self.decoder(latent)
        return reconstruction, mu, sigma


def vae_loss(x_target, x, mu, sigma):
    """Return the per-sample average VAE loss (reconstruction + KL).

    Both terms are summed over all elements and then divided by the batch
    size (``x.size(0)``), so they are on the same scale and the result does
    not depend on how many samples are in the batch.

    Args:
        x_target: Reconstruction; passed as the ``input`` of
            ``F.binary_cross_entropy``, so its values must lie in [0, 1].
        x: Reconstruction target, same shape as ``x_target``. Its first
            dimension is taken as the batch size.
        mu: Mean of the approximate posterior.
        sigma: Standard deviation of the approximate posterior.

    Returns:
        Scalar tensor: binary cross-entropy plus the KL divergence between
        N(mu, sigma^2) and the standard normal, each averaged over the batch.
    """
    batch_size = x.size(0)

    # Reconstruction term: summed over every element, then averaged per
    # sample so it is scaled the same way as the KL term below.
    generative_loss = F.binary_cross_entropy(
        x_target, x, reduction='sum'
    ) / batch_size

    # Closed-form KL(N(mu, sigma^2) || N(0, 1)); the 1e-8 guards the log
    # against a zero variance.
    variance = torch.pow(sigma, 2)
    KLD_loss = 0.5 * torch.sum(
        torch.pow(mu, 2) + variance - torch.log(1e-8 + variance) - 1
    ) / batch_size

    loss = generative_loss + KLD_loss

    return loss


# Example usage:
# a = torch.rand(10, 30)
# b = torch.rand(10, 30)
# c = torch.rand(10, 30)
# model = VAE(img_dim=30, z_dim=40, hidden_dim=40, dropout=0.4)
# model.eval()
# print(model(c))  # -> (x_target, mu, sigma)