Variational_autoencoder.py

__author__ = 'Sherlock Holmes'

import torch
import torchvision
from torch import nn
from torch import optim
import torch.nn.functional as F
from torch.autograd import Variable
from torch.utils.data import DataLoader
import os
import torch.optim as optim
from utils import *
from torch.utils.data import DataLoader
import matplotlib.pyplot as plt
import shutil

if not os.path.exists('./vae_img'):
    os.mkdir('./vae_img')

a_l=100; a_h=500;
b_l=70; b_h=300;
c_l=70; c_h=300;
#r_l=100; r_h=750;
#v_l=0.5;v_h=5;
n=20000
dim=3
ranges=[a_l,a_h,b_l,b_h,c_l,c_h]             

input_size=dim                            
output_size=dim                          


device='cpu'
num_epochs = 500
batch_size = 64
learning_rate = 1e-3
_data= gen_test_data(n,dim,ranges)
print('_data shape:',_data.shape)

os.environ["CUDA_DEVICE_ORDER"]="PCI_BUS_ID"
os.environ["CUDA_VISIBLE_DEVICES"]="0"  # specify which GPU(s) to be used

loss_train=[]; loss_validate=[]


flag_first=0
train_data,validation_data= data_split(_data,proportion=0.1)
print('Train data:',train_data.shape,'validate data:',validation_data.shape)
copied_train_data=np.copy(train_data)
copied_validation_data=np.copy(validation_data)
        
fitted_train_data= data_preperation(copied_train_data,np.array(ranges))
fitted_validation_data= data_preperation(copied_validation_data,np.array(ranges))
train_data = SimDataset(fitted_train_data)
validate_data = SimDataset(fitted_validation_data)


class VAE(nn.Module):
    def __init__(self):
        super(VAE, self).__init__()

        self.fc1 = nn.Linear(3, 128)
        self.fc2 = nn.Linear(128, 256)
        self.fc3 = nn.Linear(256, 512)
        self.fc41 = nn.Linear(512, 2)
        self.fc42 = nn.Linear(512, 2)
        self.fc5 = nn.Linear(2, 512)
        self.fc6 = nn.Linear(512,256)
        self.fc7 = nn.Linear(256,128)
        self.fc8 = nn.Linear(128, 3)

    def encode(self, x):
        h1 = F.relu(self.fc3(F.relu(self.fc2(F.relu(self.fc1(x))))))
        return self.fc41(h1), self.fc42(h1)

    def reparametrize(self, mu, logvar):
        std = logvar.mul(0.5).exp_()
        if device=='cuda':
            eps = torch.cuda.FloatTensor(std.size()).normal_()
        else:
            eps = torch.FloatTensor(std.size()).normal_()
        eps = Variable(eps)
        return eps.mul(std).add_(mu)

    def decode(self, z):
        h3 = F.relu(self.fc7(F.relu(self.fc6(F.relu(self.fc5(z))))))  
        return F.sigmoid(self.fc8(h3))

    def forward(self, x):
        mu, logvar = self.encode(x)
        z = self.reparametrize(mu, logvar)
        return self.decode(z), mu, logvar


model = VAE()
if device=='cuda':
    model.cuda()

reconstruction_function = nn.L1Loss(size_average=False)
#reconstruction_function = nn.MSELoss(size_average=False)

def loss_function(recon_x, x, mu, logvar):
    BCE = reconstruction_function(recon_x, x)  # mse loss
    BCE *=3*3
    # loss = 0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    KLD_element = mu.pow(2).add_(logvar.exp()).mul_(-1).add_(1).add_(logvar)
    KLD = torch.sum(KLD_element).mul_(-0.5)
    # KL divergence
    return BCE + KLD


optimizer = optim.Adam(model.parameters(), lr=0.001)

for epoch in range(num_epochs):
    print('epoch is:',epoch)
    model.train()
    train_loss = 0
    if epoch > num_epochs:
           break    
    try:
                dataloader = DataLoader(train_data, batch_size, True)
                correct = 0
                for x,_ in dataloader:
                	#print('x is:',x) 
                	x = Variable(x)
                	x= x.to(device)
                	optimizer.zero_grad(); 
                	recon_batch, mu, logvar = model(x); #print('recon batch:',recon_batch)
                	loss = loss_function(recon_batch,x, mu, logvar)
                	loss.backward() 
                	optimizer.step();
                	correct+= loss.item()
                train_loss=correct/len(train_data); loss_train.append(train_loss)
                #train_loss=correct; loss_train.append(train_loss)
                
                
    except KeyboardInterrupt:
                break
           
                     
fig=plt.figure(figsize=(9,6))
plt.plot(loss_train,label='training')
plt.legend()
plt.show()

torch.save(model.state_dict(), './vae.pt')


def plot3D_data(X,title):
   image_name= './images/'+title+'.png'

   from mpl_toolkits.mplot3d import Axes3D
   Axes3D = Axes3D  # pycharm auto import
   fig = plt.figure()
   ax = fig.add_subplot(111, projection='3d')
   ax.scatter(X[:,0], X[:,1], X[:,2])
   plt.title(title)
   plt.savefig(image_name)


# load the model, sample and regenerate space

# plot input and output space and compare

# write sample from normal dist 
samples= torch.from_numpy(np.random.rand(n,2).astype(float) )
#print(samples.dtype)
output= model.decode(samples.float())
#print('Samples are:',samples)

output=output.cpu().detach().numpy()
#estimate_accuracy(test_data,output)
output=rescale_data(output,ranges)
#print('Reconstructed Output is:',output)

plot3D_data(_data,'input_space')
plot3D_data(output,'output_space')

# checker function to ensure the generated data is within the bound ( take it from earlier RRCF work) 
min=[a_l,b_l,c_l]; max=[a_h,b_h,c_h]
def check_bound_samples(data,box):
    print('data',data,'box',box)
    print('box 0 is',box[0],'box[1] is',box[1])
    data=np.where((box[0].reshape(-1,1)-data) >0, -100000, data)
    #data=np.where((0-data>0,0,data))
    print('min ceiled data is:',data)
    data=np.where((data-box[1].reshape(-1,1)) >0, -100000, data)
    print('new data is:',data)
    
def create_bound_box(min,max,samples): 
    return np.concatenate((np.full((1,samples), min),np.full((1,samples),max)),axis=0)