RNN_VAE.py

import torch
import numpy as np
from torch import nn, optim
from model.RNNVAENet import RNNVAENet

# TODO: Working in Progress
class RNNVAE:
    def __init__(self, args):
        self.input_size = args.input_size
        self.hidden_size = args.hidden_size
        self.flow_dim = args.flow_dim
        self.num_of_labels = args.label_dim
        self.n_blocks = args.n_blocks
        self.num_epochs = args.epochs
        self.learning_rate = args.learning_rate
    
        self.device = torch.device("cuda:%d" % args.gpuID if args.cuda else "cpu")
        self.network = RNNVAENet(
            self.input_size, 
            self.hidden_size, 
            self.flow_dim, 
            self.input_size,
            self.num_of_labels,
            self.n_blocks,
            self.device)
        if self.network is not None:
            self.network.to(self.device)
        self.optimizer = optim.Adam(self.network.parameters(), lr=self.learning_rate, weight_decay=1e-6)

    def loss_function(self, x, recon_x, y, pred_y, sum_log_det):
        MSE = nn.MSELoss(reduction='mean')(recon_x, x)
        PRED = nn.MSELoss(reduction='mean')(pred_y, y)
        FLOW = sum_log_det.mean()
        return MSE+PRED, MSE, PRED, FLOW
    
    def smape(self, y, pred_y):
        return torch.sum(torch.abs(y-pred_y)/(torch.abs(pred_y) + torch.abs(y)),0)

    def train_epoch(self, epoch, optimizer, data_loader):
        """Train the model for one epoch
        Args:
            optimizer: (Optim) optimizer to use in backpropagation
            data_loader: (DataLoader) corresponding loader containing the training data
        Returns:
            average of all loss values, accuracy, nmi
        """
        self.network.train()
        total_loss = 0.
        recon_loss = 0.
        flow_loss = 0.
        label_loss = 0.
        smape = torch.zeros([1,5])
        # accuracy = 0.
        num_batches = 0.
        
        # true_labels_list = []
        # predicted_labels_list = []

        # iterate over the dataset
        for (data, y) in data_loader:
            data = data.to(self.device)
            if len(y.shape)==1:
                y=y.view(-1,1)
            y = y.to(self.device)
            #e = e.view(-1,1).to(self.device)

            optimizer.zero_grad()

            # flatten data
            # data = data.view(data.size(0), -1)
            
            # forward call
            recon, y_pred = self.network(data, data, teaching_ratio= 0.25) 
            log_jacob = self.network.flow.get_sum_log_det()
            total, MSE, PRED, FLOW = self.loss_function(data, recon, y, y_pred, log_jacob)
            smape += self.smape(y, y_pred).detach().cpu()
            # accumulate values
            total_loss += total.item()
            label_loss += PRED.item()

            #print(MSE.item(), PRED.item(), FLOW.item())
            

            # perform backpropagation
            total.backward()
            optimizer.step()  

            # # save predicted and true labels
            # predicted = unlab_loss_dic['predicted_labels']

            # true_labels_list.append(labels)
            # predicted_labels_list.append(predicted)   
            num_batches += 1. 
            if num_batches % 50 == 0:
                print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                    epoch, num_batches * len(data), len(data_loader.dataset),
                    100. * num_batches / len(data_loader),  total.item()))


        # average per batch
        total_loss /= num_batches
        label_loss /= num_batches
        smape /= len(data_loader.dataset)

        print('====> Epoch: {} Average loss per batch: {:.4f};\n'.format(epoch, total_loss))
        
        # # concat all true and predicted labels
        # true_labels = torch.cat(true_labels_list, dim=0).cpu().numpy()
        # predicted_labels = torch.cat(predicted_labels_list, dim=0).cpu().numpy()

        # # compute metrics

        # accuracy = 100.0 * self.metrics.cluster_acc(predicted_labels, true_labels)
        # nmi = 100.0 * self.metrics.nmi(predicted_labels, true_labels)

        return total_loss, label_loss, smape.numpy()

    def test(self, epoch, data_loader, return_loss=False):
        """Test the model with new data
        Args:
            data_loader: (DataLoader) corresponding loader containing the test/validation data
            return_loss: (boolean) whether to return the average loss values
            
        Return:
            accuracy and nmi for the given test data
        """
        self.network.eval()
        total_loss = 0.
        recon_loss = 0.
        flow_loss = 0.
        label_loss = 0.
        num_batches = 0.
        smape = torch.zeros([1,5])

        with torch.no_grad():
            for data, y in data_loader:
                data = data.to(self.device)
                if len(y.shape)==1:
                    y=y.view(-1,1)
                y = y.to(self.device)
            
                # flatten data
                # data = data.view(data.size(0), -1)

                # forward call
                
                recon, y_pred = self.network(data, data, teaching_ratio= 0) 
                log_jacob = self.network.flow.get_sum_log_det()
                total, MSE, PRED, FLOW = self.loss_function(data, recon, y, y_pred, log_jacob)
                # accumulate values
                total_loss += total.item()
                label_loss += PRED.item()
                smape += self.smape(y, y_pred).detach().cpu()
                num_batches += 1. 
        
      
        # average per batch
        if return_loss:
            total_loss /= num_batches
            label_loss /= num_batches
        
        smape /= len(data_loader.dataset)
        print('====> Test Epoch: {} Average loss per batch: {:.4f};'.format(epoch, total_loss))
        print('====> SMAPE: ' + str(smape))

        if return_loss:
            return total_loss, label_loss, smape.numpy()


    def train(self, train_loader, val_loader):
        """Train the model
        Args:
            train_loader: (DataLoader) corresponding loader containing the training data
            val_loader: (DataLoader) corresponding loader containing the validation data
        Returns:
            output: (dict) contains the history of train/val loss
        """
        train_history_err, val_history_err = [], []
        train_history_smape = np.zeros([self.num_of_labels,self.num_epochs])
        test_history_smape = np.zeros([self.num_of_labels,self.num_epochs])

        for epoch in range(1, self.num_epochs + 1):
            train_loss,energy_loss,smape_train = self.train_epoch(epoch, self.optimizer, train_loader)
            val_loss,val_energy_loss, smape_test = self.test(epoch, val_loader, True)
            train_history_err.append(energy_loss)
            val_history_err.append(val_energy_loss)
            train_history_smape[:,epoch-1] = smape_train
            test_history_smape[:,epoch-1] = smape_test


        return {'train_history_err' : train_history_err, 'val_history_err': val_history_err, 'smape_train': train_history_smape, 'smape_test': test_history_smape}