net.py

from abc import abstractmethod
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras.models import load_model
from tensorflow.keras.layers import (Dense, Dropout, Conv2D, Flatten, MaxPooling2D, Conv1D, BatchNormalization) 
from copy import deepcopy
from sklearn.model_selection import train_test_split
import datetime
import visualkeras

import pickle
import numpy as np

import losses
import util
import keras_preprocessing_custom.image

time_str = datetime.datetime.now().strftime('%d_%m_%Y__%H:%M:%S')

class NN:
    ''' The neural network class that creates and trains the  model. 
    
        Attributes
        ----------
        sim : The simulation object located in simulation.py

        eeg_topographies : ndarray (n_samples,67,67)
            A set of topographies for each eeg signal in simulation. This argument is necessary for the CNN only.

        Methods
        -------
        fit : trains the neural network with the EEG and source data
        train : trains the neural network with the EEG and source data
        predict : perform prediciton on EEG data
        evaluate : evaluate the performance of the model
    '''

    def __init__(self, sim, verbose=True):
        #self.sim = deepcopy(sim)
        self.sim = sim

        self.n_elec = self.sim.fwd.leadfield.shape[0]
        self.n_dipoles = self.sim.fwd.leadfield.shape[1]

        # simulation's samples
        self.n_samples = self.sim.eeg_data.shape[1]
        self.compiled = False

        self.verbose = verbose
        self.trained = False

    @abstractmethod
    def build_model(self):
        ''' Build the neural network architecture.       
        '''
        pass

    @abstractmethod
    def fit(self, learning_rate=0.001, 
        validation_split=0.2, epochs=500, batch_size=64, 
        loss=None, patience=250
    ):
        ''' Train the neural network using training data (eeg) and labels (sources).

            The training data are stored in the simulation object
            
            Parameters
            ----------

            learning_rate : float
                The learning rate for training the neural network
            validation_split : float
                Proportion of data to keep as validation set.
            epochs : int
                Number of epochs to train. In one epoch all training samples 
                are used once for training.
            batch_size : int
                The number of samples to simultaneously calculate the error 
                during backpropagation.
            loss : tf.keras.losses
                The loss function.
            patience: int
                Number of epochs with no improvement after which trainning will be stopped
            Return
            ------
            history, tensorboard dir : keras.callbacks.History, string
                Method returns the history and the log dir for the tensorboard.

        '''
        pass
    
    def predict(self, eeg):
        ''' Predict the sources from the eeg.
        '''
        if self.trained:
            predicted_sources = self.model.predict(eeg)
            return predicted_sources
        
        else:
            raise AttributeError('The model must be trained first.')


    @abstractmethod
    def evaluate_mse(self, eeg, sources):
        ''' Evaluate the model regarding mean squared error
        
        Parameters
        ----------         
            eeg : numpy.ndarray
                The simulated EEG data
            sources : numpy.ndarray
                The simulated EEG data

        Return
        ------
            mean_squared_errors : numpy.ndarray
            The mean squared error of each sample
        '''
        
        pass


    def save_nn(self, model_filename, save_sim=False, sim_filename='sim.pkl'):
        if self.trained:
            self.model.save(model_filename)

            if save_sim:
                with open(sim_filename, 'wb') as outp:  # Overwrites any existing file.
                    pickle.dump(self.sim, outp, pickle.HIGHEST_PROTOCOL)

        else:
            print('The model must be trained first.')
    
    def load_nn(self, model_filename):
        ''' This function loads the neural network.

            !Important!
            -----------
            The simulation object must be the same with the one that it was used during trainning. 
        '''
        self.model = load_model(model_filename,  compile=False)
        self.compiled = True
        self.trained = True
        print('Loaded model in', self.__class__.__name__,':')
        self.model.summary()

    @staticmethod
    def lr_schedule(epoch):
        '''
            Returns a custom learning rate that decreases as epochs progress.
        '''
        learning_rate = 0.01
        if epoch > 40:
            learning_rate = 0.001

        tf.summary.scalar('learning rate', data=learning_rate, step=epoch)
        return learning_rate


class EEGMLP(NN):
    '''  An MLP that predicts the location of the activation in the source space.
    It does not predict the the electrical current of each dipole.
   
    '''
    def __init__(self, sim, num_of_simultaneously_dipoles=1,verbose=True):
        super().__init__(sim, verbose)
        # number of dipoles that operate the same time.
        self.num_of_simultaneously_dipoles = num_of_simultaneously_dipoles
    
    def build_model(self):
        ''' Build the neural network architecture using the 
        tensorflow.keras.Sequential() API. 

        The architecture is an MLP with three hidden layers.
       
        '''
        if not self.compiled :
            # Build the artificial neural network model using Dense layers.
            self.model = keras.Sequential()

            # add input layer
            self.model.add(keras.Input(shape=(self.n_elec,)))

            self.model.add(Dense(1024, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            self.model.add(Dense(1024, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            self.model.add(Dense(1024, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            
            # Add output layer
            self.model.add(Dense(3*self.num_of_simultaneously_dipoles, activation='relu'))

            self.model.summary()
            if self.verbose:
                img = './assets/MLP.png'
                img_keras = './assets/MLP-visual-keras.png'
                tf.keras.utils.plot_model(self.model, to_file=img, show_shapes=True, show_layer_names=False)
                visualkeras.layered_view(self.model, legend=True,  to_file=img_keras)  


    def fit(self, learning_rate=0.001, 
        validation_split=0.2, epochs=500, batch_size=32, 
        loss=None, patience=250
    ):

        if len(self.sim.eeg_data.shape) != 2 :
            raise AttributeError("EEG data must be 2D (n_elctrodes x n_samples")

        tensorboard_dir = 'logs/MLP-Model-{}'.format(time_str)
        tensorboard_callback = tf.keras.callbacks.TensorBoard(log_dir=tensorboard_dir)
        
        # Input data
        x = self.sim.eeg_data.T        

        # Target data (3D locations in the source space)
        y = self.sim.locations        

        # early stoping
        es = tf.keras.callbacks.EarlyStopping(monitor='val_loss', \
            mode='min', patience=patience, restore_best_weights=True, verbose=1)

        optimizer = tf.keras.optimizers.Adam(learning_rate=learning_rate)


        if loss == None:
            loss = 'mse'
        
        metrics = [
            tf.keras.metrics.MeanAbsoluteError(name="MAE")
            #tf.keras.metrics.MeanAbsolutePercentageError(name="MAPE")            
        ]

        if not self.compiled:
            self.model.compile(optimizer, loss, metrics=metrics)
            self.compiled = True

        history = self.model.fit(x, y, 
                epochs=epochs, batch_size=batch_size, shuffle=True, 
                validation_split=validation_split, callbacks=[es, tensorboard_callback])
        self.trained = True
        
        return history, tensorboard_dir

    
    def evaluate_mse(self, eeg, sources):
        ''' Evaluate the model regarding mean squared error

        '''
        
        if self.trained:

            if eeg.shape[1]  != sources.shape[1]:
                raise AttributeError('EEG and Sources data must have the same amount of samples.')

            predicted_sources = self.predict(eeg=eeg.T).T        
            mean_squared_errors = np.mean((predicted_sources - sources)**2, axis=0)

            return mean_squared_errors
        else :
            print('The model must be trained first.')


class EEG_CNN(NN):
    ''' A CNN to solve the inverse problem. It predicts the electrical current of each dipole in the source space

        The additional eeg_topographies argument is a set of topographies for each eeg signal
        in simulations.
    '''

    def __init__(self, sim, eeg_topographies, verbose=True):
        super().__init__(sim, verbose)

        if len(eeg_topographies.shape) != 3 :
            raise AttributeError('The set of topographies must be a 3D-array. (n_samples x xpxiels x ypixels)')
        elif eeg_topographies.shape[0] != self.n_samples :
            raise AttributeError('Incompatible sim and topographies.')
        
        self.eeg_topographies = eeg_topographies


    def build_model(self):
        ''' Build the neural network architecture using the 
        tensorflow.keras.Sequential() API. 

        The architecture is a CNN with three hidden layers.
       
        '''
        if not self.compiled :
            # Build the artificial neural network model using Dense layers.
            self.model = keras.Sequential()

            # add input layer
            self.model.add(keras.Input(shape=(self.eeg_topographies.shape[1], self.eeg_topographies.shape[2],1), name='Input'))
            self.model.add(Conv2D(8, kernel_size=(3, 3), activation='relu'))
            #self.model.add(BatchNormalization())
            self.model.add(Flatten())            
            self.model.add(Dense(1024, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            self.model.add(Dense(1024, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            self.model.add(Dense(1024, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            # Add output layer
            self.model.add(Dense(self.n_dipoles, activation='relu', name='OutputLayer'))

            self.model.summary()
            
            if self.verbose:
                img = './assets/CNN.png'
                img_keras = './assets/CNN-visual-keras.png'
                tf.keras.utils.plot_model(self.model, to_file=img, show_shapes=True, show_layer_names=False)
                visualkeras.layered_view(self.model, legend=True,  to_file=img_keras)  
    

    def fit(self, learning_rate=0.001, 
        validation_split=0.2, epochs=500, batch_size=64, 
        loss=None, patience=250
    ):

        if len(self.sim.eeg_data.shape) != 2 :
            raise AttributeError("EEG data must be 2D (n_elctrodes x n_samples")
        elif len(self.sim.source_data.shape) != 2 :
            raise AttributeError("Sources data must be 2D (n_dipoles x n_samples")

        tensorboard_dir = 'logs/CNN-Model-{}'.format(time_str)
        tensorboard_callback = tf.keras.callbacks.TensorBoard(log_dir=tensorboard_dir)

        # Input data
        x = self.eeg_topographies       

        # Target data
        y = self.sim.source_data.T        

        # early stoping
        es = tf.keras.callbacks.EarlyStopping(monitor='val_loss', \
            mode='min', patience=patience, restore_best_weights=True,verbose=1)


        if loss == None:
            loss = 'mse'

        metrics = [
            tf.keras.metrics.MeanAbsoluteError(name='MAE')
        ]

        #lr_callback = keras.callbacks.LearningRateScheduler(NN.lr_schedule)
        optimizer = tf.keras.optimizers.Adam(learning_rate=learning_rate)

        if not self.compiled:
            self.model.compile(optimizer, loss, metrics=metrics)
            self.compiled = True

        
        #x_scaled = util.standardize_dataset(x)
        #y_scaled = util.normalize_array(y)

        # scale topos and sources
        history = self.model.fit(x, y, 
                epochs=epochs, batch_size=batch_size, shuffle=True, 
                validation_split=validation_split, callbacks=[es, tensorboard_callback])
        self.trained = True
        
        return history, tensorboard_dir

    
    def evaluate_mse(self, eeg, sources):
        ''' Evaluate the model regarding mean squared error
        
            The eeg parameter must be the eeg-topographies
        '''
        
        if self.trained:

            if len(eeg.shape) != 3 :
                raise AttributeError('The set of topographies must be a 3D-array. (n_samples x xpxiels x ypixels)')
            elif eeg.shape[0] != sources.shape[1] :
                raise AttributeError('Incompatible sim and topographies.')
           

            predicted_sources = self.predict(eeg=eeg).T        
            mean_squared_errors = np.mean((predicted_sources - sources)**2, axis=0)

            return mean_squared_errors
        else :
            print('The model must be trained first.')


class LocCNN(NN):
    ''' A CNN that predicts the location of the activation in the source space.
    It does not predict the the electrical current of each dipole.

    The additional eeg_topographies argument is a set of topographies for each eeg signal
    in simulations.
    '''
    def __init__(self, sim, eeg_topographies, num_of_simultaneously_dipoles=1,verbose=True):
        super().__init__(sim, verbose)

        if len(eeg_topographies.shape) != 3 :
            raise AttributeError('The set of topographies must be a 3D-array. (n_samples x xpxiels x ypixels)')
        elif eeg_topographies.shape[0] != self.n_samples :
            raise AttributeError('Incompatible sim and topographies.')
        
        self.eeg_topographies = eeg_topographies
        # number of dipoles that operate the same time.
        self.num_of_simultaneously_dipoles = num_of_simultaneously_dipoles


    def build_model(self):
        ''' Build the neural network architecture using the 
        tensorflow.keras.Sequential() API. 

        The architecture is a CNN with three hidden layers.
       
        '''
        if not self.compiled :
            # Build the artificial neural network model using Dense layers.
            self.model = keras.Sequential()

            # add input layer
            self.model.add(keras.Input(shape=(self.eeg_topographies.shape[1], self.eeg_topographies.shape[2],1), name='Input'))
            self.model.add(Conv2D(8, kernel_size=(3, 3), activation='relu'))
            self.model.add(MaxPooling2D(pool_size=(2, 2)))
            self.model.add(Conv2D(16, kernel_size=(3, 3), activation='relu'))

            self.model.add(Flatten())            
            self.model.add(Dropout(0.25))
            self.model.add(Dense(1024, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            self.model.add(Dense(2048, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            self.model.add(Dense(5096, activation='relu'))
            self.model.add(BatchNormalization())
            self.model.add(Dropout(0.25))
            # Add output layer with only 3 output neurons, one for each coordinate in the 3D-space.
            self.model.add(Dense(3*self.num_of_simultaneously_dipoles, activation='relu'))

            self.model.summary()
            
            if self.verbose:
                img = './assets/LocCNN.png'
                img_keras = './assets/LocCNN-visual-keras.png'
                tf.keras.utils.plot_model(self.model, to_file=img, show_shapes=True, show_layer_names=False)
                visualkeras.layered_view(self.model, legend=True,  to_file=img_keras)  


    def fit(self, learning_rate=0.001, 
        validation_split=0.2, epochs=500, batch_size=32, 
        loss=None, patience=250
    ):

        if len(self.sim.eeg_data.shape) != 2 :
            raise AttributeError("EEG data must be 2D (n_elctrodes x n_samples")

        # Input data
        x = self.eeg_topographies       

        # Target data (3D locations in the source space)
        y = self.sim.locations        

        # early stoping
        es = tf.keras.callbacks.EarlyStopping(monitor='val_loss', \
            mode='min', patience=patience, restore_best_weights=True,verbose=1)


        if loss == None:
            loss = tf.keras.losses.MeanAbsoluteError()

        metrics = [#tf.keras.metrics.MeanAbsolutePercentageError(name="MAPE"),
            'mse'         
        ]

        #lr_callback = keras.callbacks.LearningRateScheduler(NN.lr_schedule)
        optimizer = tf.keras.optimizers.SGD(learning_rate=0.001)

        if not self.compiled:
            self.model.compile(optimizer, loss, metrics=metrics)
            self.compiled = True

        
        #x_scaled = util.standardize_dataset(x)
        #y_scaled = util.normalize_array(y)

        # scale topos and sources
        history = self.model.fit(x, y, 
                epochs=epochs, batch_size=batch_size, shuffle=True, 
                validation_split=validation_split, callbacks=[es])
        self.trained = True
        
        return history


class EEGLargeCnn():
    ''' This CNN it is used only for the full source space (50460 dipoles) and it is trained using a  keras.utils.Sequence
    from the package  keras_preprocessing_custom. It can be used a very large dataset because the data are loaded in batches
    from the directories y and x . 

        Arguments
        ---------
            dir_y : directory with the sources dataset.
            dir_x : directory with the topos dataset.
    '''

    def __init__(self,dir_y,dir_x,dir_y_eval=None,dir_x_eval=None,
        verbose=False,dipoles=50460
        ):

        self.dir_y = dir_y
        self.dir_x = dir_x
        self.dir_y_eval = dir_y_eval
        self.dir_x_eval = dir_x_eval

        self.n_dipoles = dipoles
        self.verbose = verbose


    def build_model(self):
        ''' Build the neural network architecture using the 
        tensorflow.keras.Sequential() API. 

        The architecture is a CNN with three hidden layers.
       
        '''
      
        # Build the artificial neural network model using Dense layers.
        self.model = keras.Sequential()

        # add input layer
        self.model.add(keras.Input(shape=(67,67,1), name='Input'))
        self.model.add(Conv2D(8, kernel_size=(3, 3), activation='relu'))
        #self.model.add(BatchNormalization())
        self.model.add(Flatten())            
        self.model.add(Dense(1024, activation='relu'))
        self.model.add(BatchNormalization())
        self.model.add(Dropout(0.25))
        self.model.add(Dense(1024, activation='relu'))
        self.model.add(BatchNormalization())
        self.model.add(Dropout(0.25))
        self.model.add(Dense(1024, activation='relu'))
        self.model.add(BatchNormalization())
        self.model.add(Dropout(0.25))
        # Add output layer
        self.model.add(Dense(self.n_dipoles, activation='relu', name='OutputLayer'))

        self.model.summary()
        
        if self.verbose:
            img = './assets/CNN.png'
            img_keras = './assets/CNN-visual-keras.png'
            tf.keras.utils.plot_model(self.model, to_file=img, show_shapes=True, show_layer_names=False)
            visualkeras.layered_view(self.model, legend=True,  to_file=img_keras)  
    
    def fit(self, learning_rate=0.001, epochs=500,
        batch_size=32,loss=None, patience=250
        ):
               
        loader = keras_preprocessing_custom.image.DataLoader()

        train_loader = loader.flow_from_directory(
            dir_y=self.dir_y,
            dir_x=self.dir_x,
            batch_size=batch_size,
        )        

        if loss == None:
            loss = 'mse'

        #lr_callback = keras.callbacks.LearningRateScheduler(NN.lr_schedule)
        optimizer = tf.keras.optimizers.Adam(learning_rate=learning_rate)

        self.model.compile(optimizer, loss, metrics=None)      

        
        if self.dir_x_eval != None and self.dir_y_eval != None:
            eval_loader = loader.flow_from_directory(
                dir_y=self.dir_y_eval,
                dir_x=self.dir_x_eval,
                batch_size=batch_size,
            )

            # early stoping
            es = tf.keras.callbacks.EarlyStopping(monitor='val_loss', \
                mode='min', patience=patience, restore_best_weights=True,verbose=1)

            history = self.model.fit(train_loader, 
                    epochs=epochs, batch_size=batch_size, shuffle=False, 
                    validation_data=eval_loader, #steps_per_epoch= train_loader.n / batch_size,
                    callbacks=[es]
                )
        else :
            es = tf.keras.callbacks.EarlyStopping(monitor='loss', \
                mode='min', patience=patience, restore_best_weights=True,verbose=1)

            history = self.model.fit(train_loader, 
                    epochs=epochs, batch_size=batch_size, shuffle=False, 
                    #steps_per_epoch= train_loader.n / batch_size,
                    callbacks=[es]
                )

        self.trained = True
        
        return history

    def predict(self, eeg_topos):
        ''' Predict the sources from the eeg_topos.
        '''
        predicted_sources = self.model.predict(eeg_topos)
        return predicted_sources
    
    def save_nn(self, model_filename):
        if self.trained:
            self.model.save(model_filename)
        else:
            print('The model must be trained first.')
    
    def load_nn(self, model_filename, trained_model=True):
        ''' This function loads the neural network.

            !Important!
            -----------
            The simulation object must be the same with the one that it was used during trainning. 
        '''
        self.model = load_model(model_filename,  compile=False)
        self.trained = trained_model
        print('Loaded model in', self.__class__.__name__,':')
        self.model.summary()