diff --git a/portiloop_software/__init__.py b/portiloop_software/__init__.py
index 80823c3..e69de29 100644
--- a/portiloop_software/__init__.py
+++ b/portiloop_software/__init__.py
@@ -1 +0,0 @@
-from portiloop_software.portiloop_python.ANN.portiloop_detector_training import run_offline_unlabelled, get_final_model_config_dict
diff --git a/portiloop_software/portiloop_python/ANN/configs.py b/portiloop_software/portiloop_python/ANN/configs.py
new file mode 100644
index 0000000..07d5dc2
--- /dev/null
+++ b/portiloop_software/portiloop_python/ANN/configs.py
@@ -0,0 +1,98 @@
+
+def get_nn_dict(config_name, ablation, index, split_i):
+
+    if config_name == 'spindle_net':
+        return {'experiment_name': f'spindleNet_{index}', 'device_train': 'cuda:0', 'device_val':
+                'cuda:0', 'nb_epoch_max': 500,
+                'max_duration': 257400, 'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
+                'nb_batch_per_epoch': 1000,
+                'first_layer_dropout': False,
+                'power_features_input': True, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
+                'reg_balancing': 'none',
+                'nb_conv_layers': 5,
+                'seq_len': 50, 'nb_channel': 40, 'hidden_size': 100, 'seq_stride_s': 0.004, 'nb_rnn_layers': 1, 'RNN': True,
+                'envelope_input': True,
+                "batch_size": 20, "lr_adam": 0.0009,
+                'window_size_s': 0.250, 'stride_pool': 1, 'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 5,
+                'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 2, 'time_in_past': 1.55, 'estimator_size_memory': 139942400}
+        # put LSTM and Softmax for the occasion and add padding, not exactly the same frequency (spindleNet = 200 Hz)
+
+    elif config_name == 'ablation_portiloop':
+        return {'experiment_name': f'ABLATION_{ablation}_test_v11_implemented_on_portiloop_{index}', 'device_train': 'cuda:0', 'device_val':
+                'cuda:0', 'nb_epoch_max': 500,
+                'max_duration': 257400, 'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
+                'nb_batch_per_epoch': 1000,
+                'first_layer_dropout': False,
+                'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
+                'reg_balancing': 'none',
+                'nb_conv_layers': 4,
+                'seq_len': 50, 'nb_channel': 26, 'hidden_size': 7, 'seq_stride_s': 0.044, 'nb_rnn_layers': 2, 'RNN': True,
+                'envelope_input': True,
+                "batch_size": 256, "lr_adam": 0.0009,
+                'window_size_s': 0.234, 'stride_pool': 1, 'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 9,
+                'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 2, 'time_in_past': 1.55, 'estimator_size_memory': 139942400,
+                'split_idx': split_i, 'validation_network_stride': 1}
+    elif config_name == 'pareto_search_small_seq':
+        return {'experiment_name': f'pareto_search_15_35_v5_small_seq_{index}', 'device_train': 'cuda:0', 'device_val': 'cuda:0', 'nb_epoch_max': 150,
+                'max_duration':
+                257400,
+                'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250, 'nb_batch_per_epoch': 1000,
+                'first_layer_dropout': False,
+                'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
+                'reg_balancing': 'none',
+                'split_idx': split_i, 'validation_network_stride': 1, 'nb_conv_layers': 3, 'seq_len': 50, 'nb_channel': 31, 'hidden_size': 7,
+                'seq_stride_s': 0.02,
+                'nb_rnn_layers': 1, 'RNN': True, 'envelope_input': False, 'lr_adam': 0.0005, 'batch_size': 256, 'window_size_s': 0.218,
+                'stride_pool': 1,
+                'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 7, 'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 18, 'time_in_past': 8.5,
+                'estimator_size_memory': 188006400}
+    elif config_name == '2_inputs_network':
+        return {'experiment_name': f'ABLATION_{ablation}_2inputs_network_{index}', 'device_train': 'cuda:0', 'device_val':
+                'cuda:0', 'nb_epoch_max': 500,
+                'max_duration': 257400, 'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
+                'nb_batch_per_epoch': 1000,
+                'first_layer_dropout': False,
+                'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
+                'reg_balancing': 'none',
+                'nb_conv_layers': 4,
+                'seq_len': 50, 'nb_channel': 26, 'hidden_size': 7, 'seq_stride_s': 0.044, 'nb_rnn_layers': 2, 'RNN': True,
+                'envelope_input': True,
+                "batch_size": 256, "lr_adam": 0.0009,
+                'window_size_s': 0.234, 'stride_pool': 1, 'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 9,
+                'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 2, 'time_in_past': 1.55, 'estimator_size_memory': 139942400,
+                'split_idx': split_i, 'validation_network_stride': 1}
+    elif config_name == 'pareto_search_v6':
+        return {'experiment_name': f'pareto_search_15_35_v6_{index}', 'device_train': 'cpu', 'device_val': 'cpu', 'nb_epoch_max': 500,
+                'max_duration':
+                257400,
+                'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250, 'nb_batch_per_epoch': 1000,
+                'first_layer_dropout': False,
+                'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
+                'reg_balancing': 'none',
+                'split_idx': split_i, 'validation_network_stride': 1, 'nb_conv_layers': 3, 'seq_len': 50, 'nb_channel': 31, 'hidden_size': 7,
+                'seq_stride_s': 0.17,
+                'nb_rnn_layers': 1, 'RNN': True, 'envelope_input': False, 'lr_adam': 0.0005, 'batch_size': 256, 'window_size_s': 0.218,
+                'stride_pool': 1,
+                'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 7, 'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 18, 'time_in_past': 8.5,
+                'estimator_size_memory': 188006400}
+    elif config_name == 'pareto_search_v4':
+        return {'experiment_name': f'pareto_search_15_35_v4_{index}', 'device_train': 'cpu', 'device_val': 'cpu',
+                'device_inference': 'cpu', 'nb_epoch_max': 150, 'max_duration': 257400,
+                'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
+                'nb_batch_per_epoch': 1000,
+                'first_layer_dropout': False,
+                'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0,
+                'classification': True,
+                'reg_balancing': 'none',
+                'split_idx': split_i, 'validation_network_stride': 1, 'nb_conv_layers': 3, 'seq_len': 50,
+                'nb_channel': 31, 'hidden_size': 7,
+                'seq_stride_s': 0.170,
+                'nb_rnn_layers': 1, 'RNN': True, 'envelope_input': False, 'lr_adam': 0.0005, 'batch_size': 256,
+                'window_size_s': 0.218,
+                'stride_pool': 1,
+                'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 7, 'dilation_conv': 1, 'dilation_pool': 1,
+                'nb_out': 18, 'time_in_past': 8.5,
+                'estimator_size_memory': 188006400}
+    else:
+        raise ValueError(
+            'Given config dict must either be a json file with .json extension or one of the default names of configuration.')
diff --git a/portiloop_software/portiloop_python/ANN/dataset.py b/portiloop_software/portiloop_python/ANN/dataset.py
new file mode 100644
index 0000000..80164b6
--- /dev/null
+++ b/portiloop_software/portiloop_python/ANN/dataset.py
@@ -0,0 +1,484 @@
+from pathlib import Path
+from random import randint, seed
+import numpy as np
+import pandas as pd
+import logging
+
+from torch.utils.data import Dataset, DataLoader
+from torch.utils.data.sampler import Sampler
+import torch
+from sklearn.model_selection import train_test_split
+
+
+class SignalDataset(Dataset):
+    def __init__(self, exp_config, filename, path, window_size, fe, seq_len, seq_stride, list_subject, len_segment):
+        self.fe = fe
+        self.window_size = window_size
+        self.path_file = Path(path) / filename
+        self.exp_config = exp_config
+
+        self.data = pd.read_csv(self.path_file, header=None).to_numpy()
+        assert list_subject is not None
+        used_sequence = np.hstack(
+            [range(int(s[1]), int(s[2])) for s in list_subject])
+        # 115+30 = nb seconds per sequence in the dataset
+        split_data = np.array(np.split(self.data, int(
+            len(self.data) / (len_segment + 30 * fe))))
+        split_data = split_data[used_sequence]
+        self.data = np.transpose(split_data.reshape(
+            (split_data.shape[0] * split_data.shape[1], 4)))
+
+        assert self.window_size <= len(
+            self.data[0]), "Dataset smaller than window size."
+        self.full_signal = torch.tensor(self.data[0], dtype=torch.float)
+        self.full_envelope = torch.tensor(self.data[1], dtype=torch.float)
+        self.seq_len = seq_len  # 1 means single sample / no sequence ?
+        self.idx_stride = seq_stride
+        self.past_signal_len = self.seq_len * self.idx_stride
+
+        # list of indices that can be sampled:
+        self.indices = [idx for idx in range(len(self.data[0]) - self.window_size)  # all possible idxs in the dataset
+                        if not (self.data[3][idx + self.window_size - 1] < 0  # that are not ending in an unlabeled zone
+                                or idx < self.past_signal_len)]  # and far enough from the beginning to build a sequence up to here
+        total_spindles = np.sum(self.data[3] > self.exp_config['threshold'])
+        logging.debug(
+            f"total number of spindles in this dataset : {total_spindles}")
+
+    def __len__(self):
+        return len(self.indices)
+
+    def __getitem__(self, idx):
+        assert 0 <= idx < len(self), f"Index out of range ({idx}/{len(self)})."
+        idx = self.indices[idx]
+        assert self.data[3][idx + self.window_size -
+                            1] >= 0, f"Bad index: {idx}."
+
+        signal_seq = self.full_signal[idx - (self.past_signal_len - self.idx_stride)                                      :idx + self.window_size].unfold(0, self.window_size, self.idx_stride)
+        envelope_seq = self.full_envelope[idx - (self.past_signal_len - self.idx_stride)                                          :idx + self.window_size].unfold(0, self.window_size, self.idx_stride)
+
+        ratio_pf = torch.tensor(
+            self.data[2][idx + self.window_size - 1], dtype=torch.float)
+        label = torch.tensor(
+            self.data[3][idx + self.window_size - 1], dtype=torch.float)
+
+        return signal_seq, envelope_seq, ratio_pf, label
+
+    def is_spindle(self, idx):
+        assert 0 <= idx <= len(
+            self), f"Index out of range ({idx}/{len(self)})."
+        idx = self.indices[idx]
+        return True if (self.data[3][idx + self.window_size - 1] > self.exp_config['threshold']) else False
+
+
+class UnlabelledSignalDatasetSingleSegment(Dataset):
+    """
+    Caution: this dataset does not sample sequences, but single windows
+    """
+
+    def __init__(self, unlabelled_segment, window_size):
+        self.window_size = window_size
+        self.full_signal = torch.tensor(
+            unlabelled_segment, dtype=torch.float).squeeze()
+        assert len(
+            self.full_signal.shape) == 1, f"Segment has more than one dimension: {self.full_signal.shape}"
+        assert self.window_size <= len(
+            self.full_signal), "Segment smaller than window size."
+        self.seq_len = 1  # 1 means single sample / no sequence ?
+        self.idx_stride = 1
+        self.past_signal_len = self.seq_len * self.idx_stride
+
+        # list of indices that can be sampled:
+        self.indices = [idx for idx in range(len(self.full_signal) - self.window_size)  # all possible idxs in the dataset
+                        if (not idx < self.past_signal_len)]  # far enough from the beginning to build a sequence up to here
+
+    def __len__(self):
+        return len(self.indices)
+
+    def __getitem__(self, idx):
+        assert 0 <= idx < len(self), f"Index out of range ({idx}/{len(self)})."
+        idx = self.indices[idx]
+        signal_seq = self.full_signal[idx:idx +
+                                      self.window_size].unfold(0, self.window_size, 1)
+        true_idx = idx + self.window_size
+        return signal_seq, true_idx
+
+
+def get_class_idxs(dataset, distribution_mode):
+    """
+    Directly outputs idx_true and idx_false arrays
+    """
+    length_dataset = len(dataset)
+
+    nb_true = 0
+    nb_false = 0
+
+    idx_true = []
+    idx_false = []
+
+    for i in range(length_dataset):
+        is_spindle = dataset.is_spindle(i)
+        if is_spindle or distribution_mode == 1:
+            nb_true += 1
+            idx_true.append(i)
+        else:
+            nb_false += 1
+            idx_false.append(i)
+
+    assert len(dataset) == nb_true + nb_false, f"Bad length dataset"
+
+    return np.array(idx_true), np.array(idx_false)
+
+
+# Sampler avec liste et sans rand liste
+
+class RandomSampler(Sampler):
+    """
+    Samples elements randomly and evenly between the two classes.
+    The sampling happens WITH replacement.
+    __iter__ stops after an arbitrary number of iterations = batch_size_list * nb_batch
+    Arguments:
+      idx_true: np.array
+      idx_false: np.array
+      batch_size (int)
+      nb_batch (int, optional): number of iteration before end of __iter__(), this defaults to len(data_source)
+    """
+
+    def __init__(self, idx_true, idx_false, batch_size, distribution_mode, nb_batch):
+        self.idx_true = idx_true
+        self.idx_false = idx_false
+        self.nb_true = self.idx_true.size
+        self.nb_false = self.idx_false.size
+        self.length = nb_batch * batch_size
+        self.distribution_mode = distribution_mode
+
+    def __iter__(self):
+        global precision_validation_factor
+        global recall_validation_factor
+        cur_iter = 0
+        seed()
+        # epsilon = 1e-7 proba = float(0.5 + 0.5 * (precision_validation_factor - recall_validation_factor) / (precision_validation_factor +
+        # recall_validation_factor + epsilon))
+        proba = 0.5
+        if self.distribution_mode == 1:
+            proba = 1
+        logging.debug(f"proba: {proba}")
+
+        while cur_iter < self.length:
+            cur_iter += 1
+            sample_class = np.random.choice([0, 1], p=[1 - proba, proba])
+            if sample_class:  # sample true
+                idx_file = randint(0, self.nb_true - 1)
+                idx_res = self.idx_true[idx_file]
+            else:  # sample false
+                idx_file = randint(0, self.nb_false - 1)
+                idx_res = self.idx_false[idx_file]
+
+            yield idx_res
+
+    def __len__(self):
+        return self.length
+
+
+# Sampler validation
+
+class ValidationSampler(Sampler):
+    """
+    network_stride (int >= 1, default: 1): divides the size of the dataset (and of the batch) by striding further than 1
+    """
+
+    def __init__(self, data_source, seq_stride, nb_segment, len_segment, network_stride):
+        network_stride = int(network_stride)
+        assert network_stride >= 1
+        self.network_stride = network_stride
+        self.seq_stride = seq_stride
+        self.data = data_source
+        self.nb_segment = nb_segment
+        self.len_segment = len_segment
+
+    def __iter__(self):
+        seed()
+        # len sequence = 115 s + add the 15 first s?
+        batches_per_segment = self.len_segment // self.seq_stride
+        cursor_batch = 0
+        while cursor_batch < batches_per_segment:
+            for i in range(self.nb_segment):
+                for j in range(0, (self.seq_stride // self.network_stride) * self.network_stride, self.network_stride):
+                    cur_idx = i * self.len_segment + j + cursor_batch * self.seq_stride
+                    # print(f"i:{i}, j:{j}, self.len_segment:{self.len_segment}, cursor_batch:{cursor_batch}, self.seq_stride:{self.seq_stride}, cur_idx:{cur_idx}")
+                    yield cur_idx
+            cursor_batch += 1
+
+    def __len__(self):
+        assert False
+        # return len(self.data)
+        # return len(self.data_source)
+
+
+def generate_label_distribution_and_lds(dataset, kernel_size=5, kernel_std=2.0, nb_bins=100, reweight='inv_sqrt'):
+    """
+    Returns:
+        distribution: the distribution of labels in the dataset
+        lds: the same distribution, smoothed with a gaussian kernel
+    """
+
+    weights = torch.tensor([0.3252, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0069, 0.0163,
+                            0.0000, 0.0366, 0.0000, 0.0179, 0.0000, 0.0076, 0.0444, 0.0176, 0.0025,
+                            0.0056, 0.0000, 0.0416, 0.0039, 0.0000, 0.0000, 0.0000, 0.0171, 0.0000,
+                            0.0000, 0.0042, 0.0114, 0.0209, 0.0023, 0.0036, 0.0106, 0.0241, 0.0034,
+                            0.0000, 0.0056, 0.0000, 0.0029, 0.0241, 0.0076, 0.0027, 0.0012, 0.0000,
+                            0.0166, 0.0028, 0.0000, 0.0000, 0.0000, 0.0197, 0.0000, 0.0000, 0.0021,
+                            0.0054, 0.0191, 0.0014, 0.0023, 0.0074, 0.0000, 0.0186, 0.0000, 0.0088,
+                            0.0000, 0.0032, 0.0135, 0.0069, 0.0029, 0.0016, 0.0164, 0.0068, 0.0022,
+                            0.0000, 0.0000, 0.0000, 0.0191, 0.0000, 0.0000, 0.0017, 0.0082, 0.0181,
+                            0.0019, 0.0038, 0.0064, 0.0000, 0.0133, 0.0000, 0.0069, 0.0000, 0.0025,
+                            0.0186, 0.0076, 0.0031, 0.0016, 0.0218, 0.0105, 0.0049, 0.0000, 0.0000,
+                            0.0246], dtype=torch.float64)
+
+    lds = None
+    dist = None
+    bins = None
+    return weights, dist, lds, bins
+
+    # TODO: remove before ?????
+
+    dataset_len = len(dataset)
+    logging.debug(
+        f"Length of the dataset passed to generate_label_distribution_and_lds: {dataset_len}")
+    logging.debug(f"kernel_size: {kernel_size}")
+    logging.debug(f"kernel_std: {kernel_std}")
+    logging.debug(f"Generating empirical distribution...")
+
+    tab = np.array([dataset[i][3].item() for i in range(dataset_len)])
+    tab = np.around(tab, decimals=5)
+    elts = np.unique(tab)
+    logging.debug(f"all labels: {elts}")
+    dist, bins = np.histogram(
+        tab, bins=nb_bins, density=False, range=(0.0, 1.0))
+
+    # dist, bins = np.histogram([dataset[i][3].item() for i in range(dataset_len)], bins=nb_bins, density=False, range=(0.0, 1.0))
+
+    logging.debug(f"dist: {dist}")
+
+    # kernel = get_lds_kernel(kernel_size, kernel_std)
+    # lds = convolve1d(dist, weights=kernel, mode='constant')
+
+    lds = gaussian_filter1d(input=dist, sigma=kernel_std, axis=- 1,
+                            order=0, output=None, mode='reflect', cval=0.0, truncate=4.0)
+
+    weights = np.sqrt(lds) if reweight == 'inv_sqrt' else lds
+    # scaling = len(weights) / np.sum(weights)  # not the same implementation as in the original repo
+    scaling = 1.0 / np.sum(weights)
+    weights = weights * scaling
+
+    return weights, dist, lds, bins
+
+
+class LabelDistributionSmoothing:
+    def __init__(self, c=1.0, dataset=None, weights=None, kernel_size=5, kernel_std=2.0, nb_bins=100, weighting_mode="inv_sqrt"):
+        """
+        If provided, lds_distribution must be a numpy.array representing a density over [0.0, 1.0] (e.g. first element of a numpy.histogram)
+        When lds_distribution is provided, it overrides everything else
+        c is the scaling constant for lds weights
+        weighting_mode can be 'inv' or 'inv_sqrt'
+        """
+        assert dataset is not None or weights is not None, "Either a dataset or weights must be provided"
+        self.distribution = None
+        self.bins = None
+        self.lds_distribution = None
+        if weights is None:
+            self.weights, self.distribution, self.lds_distribution, self.bins = generate_label_distribution_and_lds(dataset, kernel_size, kernel_std,
+                                                                                                                    nb_bins, weighting_mode)
+            logging.debug(f"self.distribution: {self.weights}")
+            logging.debug(f"self.lds_distribution: {self.weights}")
+        else:
+            self.weights = weights
+        self.nb_bins = len(self.weights)
+        self.bin_width = 1.0 / self.nb_bins
+        self.c = c
+        logging.debug(
+            f"The LDS distribution has {self.nb_bins} bins of width {self.bin_width}")
+        self.weights = torch.tensor(self.weights)
+
+        logging.debug(f"self.weights: {self.weights}")
+
+    def lds_weights_batch(self, batch_labels):
+        device = batch_labels.device
+        if self.weights.device != device:
+            self.weights = self.weights.to(device)
+        last_bin = 1.0 - self.bin_width
+        batch_idxs = torch.minimum(batch_labels, torch.ones_like(
+            batch_labels) * last_bin) / self.bin_width  # FIXME : double check
+        batch_idxs = batch_idxs.floor().long()
+        res = 1.0 / self.weights[batch_idxs]
+        return res
+
+    def __str__(self):
+        return f"LDS nb_bins: {self.nb_bins}\nbins: {self.bins}\ndistribution: {self.distribution}\nlds_distribution: {self.lds_distribution}\nweights: {self.weights} "
+
+
+def generate_dataloader(data_config, exp_config, window_size, fe, seq_len, seq_stride, distribution_mode, batch_size, nb_batch_per_epoch, classification, split_i,
+                        network_stride):
+    all_subject = pd.read_csv(
+        Path(data_config['path_dataset']) / data_config['subject_list'], header=None, delim_whitespace=True).to_numpy()
+    test_subject = None
+    if exp_config['phase'] == 'full':
+        p1_subject = pd.read_csv(Path(
+            data_config['path_dataset']) / data_config['subject_list_p1'], header=None, delim_whitespace=True).to_numpy()
+        p2_subject = pd.read_csv(Path(
+            data_config['path_dataset']) / data_config['subject_list_p2'], header=None, delim_whitespace=True).to_numpy()
+        train_subject_p1, validation_subject_p1 = train_test_split(
+            p1_subject, train_size=0.8, random_state=split_i)
+        if exp_config['test']:
+            test_subject_p1, validation_subject_p1 = train_test_split(
+                validation_subject_p1, train_size=0.5, random_state=split_i)
+        train_subject_p2, validation_subject_p2 = train_test_split(
+            p2_subject, train_size=0.8, random_state=split_i)
+        if exp_config['test']:
+            test_subject_p2, validation_subject_p2 = train_test_split(
+                validation_subject_p2, train_size=0.5, random_state=split_i)
+        train_subject = np.array(
+            [s for s in all_subject if s[0] in train_subject_p1[:, 0] or s[0] in train_subject_p2[:, 0]]).squeeze()
+        if exp_config['test']:
+            test_subject = np.array(
+                [s for s in all_subject if s[0] in test_subject_p1[:, 0] or s[0] in test_subject_p2[:, 0]]).squeeze()
+        validation_subject = np.array(
+            [s for s in all_subject if s[0] in validation_subject_p1[:, 0] or s[0] in validation_subject_p2[:, 0]]).squeeze()
+    else:
+        train_subject, validation_subject = train_test_split(
+            all_subject, train_size=0.8, random_state=split_i)
+        if exp_config['test']:
+            test_subject, validation_subject = train_test_split(
+                validation_subject, train_size=0.5, random_state=split_i)
+    logging.debug(f"Subjects in training : {train_subject[:, 0]}")
+    logging.debug(f"Subjects in validation : {validation_subject[:, 0]}")
+    if exp_config['test']:
+        logging.debug(f"Subjects in test : {test_subject[:, 0]}")
+
+    len_segment = exp_config['len_segment'] * fe
+    train_loader = None
+    validation_loader = None
+    test_loader = None
+    batch_size_validation = None
+    batch_size_test = None
+    filename = data_config['filename_classification_dataset'] if classification else data_config['filename_regression_dataset']
+
+    if seq_len is not None:
+        nb_segment_validation = len(
+            np.hstack([range(int(s[1]), int(s[2])) for s in validation_subject]))
+        batch_size_validation = len(list(range(
+            0, (seq_stride // network_stride) * network_stride, network_stride))) * nb_segment_validation
+
+        ds_train = SignalDataset(
+            exp_config=exp_config,
+            filename=filename,
+            path=data_config['path_dataset'],
+            window_size=window_size,
+            fe=fe,
+            seq_len=seq_len,
+            seq_stride=seq_stride,
+            list_subject=train_subject,
+            len_segment=len_segment)
+
+        ds_validation = SignalDataset(
+            exp_config=exp_config,
+            filename=filename,
+            path=data_config['path_dataset'],
+            window_size=window_size,
+            fe=fe,
+            seq_len=1,
+            seq_stride=1,  # just to be sure, fixed value
+            list_subject=validation_subject,
+            len_segment=len_segment)
+        idx_true, idx_false = get_class_idxs(ds_train, distribution_mode)
+        samp_train = RandomSampler(
+            idx_true=idx_true,
+            idx_false=idx_false,
+            batch_size=batch_size,
+            nb_batch=nb_batch_per_epoch,
+            distribution_mode=distribution_mode)
+
+        samp_validation = ValidationSampler(
+            ds_validation,
+            seq_stride=seq_stride,
+            len_segment=len_segment,
+            nb_segment=nb_segment_validation,
+            network_stride=network_stride)
+        train_loader = DataLoader(
+            ds_train,
+            batch_size=batch_size,
+            sampler=samp_train,
+            shuffle=False,
+            num_workers=0,
+            pin_memory=True)
+
+        validation_loader = DataLoader(
+            ds_validation,
+            batch_size=batch_size_validation,
+            sampler=samp_validation,
+            num_workers=0,
+            pin_memory=True,
+            shuffle=False)
+    else:
+        nb_segment_test = len(
+            np.hstack([range(int(s[1]), int(s[2])) for s in test_subject]))
+        batch_size_test = len(list(range(
+            0, (seq_stride // network_stride) * network_stride, network_stride))) * nb_segment_test
+
+        ds_test = SignalDataset(
+            exp_config=exp_config,
+            filename=filename,
+            path=data_config['path_dataset'],
+            window_size=window_size,
+            fe=fe,
+            seq_len=1,
+            seq_stride=1,  # just to be sure, fixed value
+            list_subject=test_subject,
+            len_segment=len_segment)
+
+        samp_test = ValidationSampler(
+            ds_test,
+            seq_stride=seq_stride,
+            len_segment=len_segment,
+            nb_segment=nb_segment_test,
+            network_stride=network_stride)
+
+        test_loader = DataLoader(
+            ds_test,
+            batch_size=batch_size_test,
+            sampler=samp_test,
+            num_workers=0,
+            pin_memory=True,
+            shuffle=False)
+
+    return train_loader, validation_loader, batch_size_validation, test_loader, batch_size_test, test_subject
+
+
+def generate_dataloader_unlabelled_offline(unlabelled_segment,
+                                           window_size,
+                                           seq_stride,
+                                           network_stride):
+    nb_segment_test = 1
+    batch_size_test = len(list(range(0, (seq_stride // network_stride)
+                          * network_stride, network_stride))) * nb_segment_test
+    unlabelled_segment = torch.tensor(
+        unlabelled_segment, dtype=torch.float).squeeze()
+    assert len(
+        unlabelled_segment.shape) == 1, f"Segment has more than one dimension: {unlabelled_segment.shape}"
+    len_segment = len(unlabelled_segment)
+    ds_test = UnlabelledSignalDatasetSingleSegment(unlabelled_segment=unlabelled_segment,
+                                                   window_size=window_size)
+    samp_test = ValidationSampler(ds_test,
+                                  seq_stride=seq_stride,
+                                  # because we don't have additional data at the end on the signal here
+                                  len_segment=len_segment-window_size,
+                                  nb_segment=nb_segment_test,
+                                  network_stride=network_stride)
+
+    test_loader = DataLoader(ds_test,
+                             batch_size=batch_size_test,
+                             sampler=samp_test,
+                             num_workers=0,
+                             pin_memory=True,
+                             shuffle=False)
+
+    return test_loader, batch_size_test
diff --git a/portiloop_software/portiloop_python/ANN/nn_utils.py b/portiloop_software/portiloop_python/ANN/nn_utils.py
new file mode 100644
index 0000000..8009085
--- /dev/null
+++ b/portiloop_software/portiloop_python/ANN/nn_utils.py
@@ -0,0 +1,185 @@
+'''
+Script containing Utils for training an ANN for the Portiloop
+'''
+
+import torch
+import os
+import wandb
+import copy
+import logging
+from scipy.ndimage import gaussian_filter1d
+
+
+class LoggerWandb:
+    def __init__(self, experiment_name, c_dict, project_name, data_config):
+        self.data_config = data_config
+        self.best_model = None
+        self.experiment_name = experiment_name
+        os.environ['WANDB_API_KEY'] = "cd105554ccdfeee0bbe69c175ba0c14ed41f6e00"
+        self.wandb_run = wandb.init(project=project_name, entity="portiloop", id=experiment_name, resume="allow",
+                                    config=c_dict, reinit=True)
+
+    def log(self,
+            accuracy_train,
+            loss_train,
+            accuracy_validation,
+            loss_validation,
+            f1_validation,
+            precision_validation,
+            recall_validation,
+            best_epoch,
+            best_model,
+            loss_early_stopping,
+            best_epoch_early_stopping,
+            best_model_accuracy_validation,
+            best_model_f1_score_validation,
+            best_model_precision_validation,
+            best_model_recall_validation,
+            best_model_loss_validation,
+            best_model_on_loss_accuracy_validation,
+            best_model_on_loss_f1_score_validation,
+            best_model_on_loss_precision_validation,
+            best_model_on_loss_recall_validation,
+            best_model_on_loss_loss_validation,
+            updated_model=False,
+            ):
+        self.best_model = best_model
+        self.wandb_run.log({
+            "accuracy_train": accuracy_train,
+            "loss_train": loss_train,
+            "accuracy_validation": accuracy_validation,
+            "loss_validation": loss_validation,
+            "f1_validation": f1_validation,
+            "precision_validation": precision_validation,
+            "recall_validation": recall_validation,
+            "loss_early_stopping": loss_early_stopping,
+        })
+        self.wandb_run.summary["best_epoch"] = best_epoch
+        self.wandb_run.summary["best_epoch_early_stopping"] = best_epoch_early_stopping
+        self.wandb_run.summary["best_model_f1_score_validation"] = best_model_f1_score_validation
+        self.wandb_run.summary["best_model_precision_validation"] = best_model_precision_validation
+        self.wandb_run.summary["best_model_recall_validation"] = best_model_recall_validation
+        self.wandb_run.summary["best_model_loss_validation"] = best_model_loss_validation
+        self.wandb_run.summary["best_model_accuracy_validation"] = best_model_accuracy_validation
+        self.wandb_run.summary["best_model_on_loss_f1_score_validation"] = best_model_on_loss_f1_score_validation
+        self.wandb_run.summary["best_model_on_loss_precision_validation"] = best_model_on_loss_precision_validation
+        self.wandb_run.summary["best_model_on_loss_recall_validation"] = best_model_on_loss_recall_validation
+        self.wandb_run.summary["best_model_on_loss_loss_validation"] = best_model_on_loss_loss_validation
+        self.wandb_run.summary["best_model_on_loss_accuracy_validation"] = best_model_on_loss_accuracy_validation
+        if updated_model:
+            self.wandb_run.save(os.path.join(
+                self.data_config['path_dataset'], self.experiment_name), policy="live", base_path=self.data_config['path_dataset'])
+            self.wandb_run.save(os.path.join(
+                self.data_config['path_dataset'], self.experiment_name + "_on_loss"), policy="live", base_path=self.data_config['path_dataset'])
+
+    def __del__(self):
+        self.wandb_run.finish()
+
+    def restore(self, classif):
+        if classif:
+            self.wandb_run.restore(self.experiment_name,
+                                   root=self.data_config['path_dataset'])
+        else:
+            self.wandb_run.restore(
+                self.experiment_name + "_on_loss", root=self.data_config['path_dataset'])
+
+
+def f1_loss(output, batch_labels):
+    # logging.debug(f"output in loss : {output[:,1]}")
+    # logging.debug(f"batch_labels in loss : {batch_labels}")
+    y_pred = output
+    tp = (batch_labels * y_pred).sum().to(torch.float32)
+    tn = ((1 - batch_labels) * (1 - y_pred)).sum().to(torch.float32).item()
+    fp = ((1 - batch_labels) * y_pred).sum().to(torch.float32)
+    fn = (batch_labels * (1 - y_pred)).sum().to(torch.float32)
+
+    epsilon = 1e-7
+    F1_class1 = 2 * tp / (2 * tp + fp + fn + epsilon)
+    F1_class0 = 2 * tn / (2 * tn + fn + fp + epsilon)
+    New_F1 = (F1_class1 + F1_class0) / 2
+    return 1 - New_F1
+
+
+def get_metrics(tp, fp, fn):
+    tp_sum = tp.sum().to(torch.float32).item()
+    fp_sum = fp.sum().to(torch.float32).item()
+    fn_sum = fn.sum().to(torch.float32).item()
+    epsilon = 1e-7
+
+    precision = tp_sum / (tp_sum + fp_sum + epsilon)
+    recall = tp_sum / (tp_sum + fn_sum + epsilon)
+
+    f1 = 2 * (precision * recall) / (precision + recall + epsilon)
+
+    return f1, precision, recall
+
+
+def get_lds_kernel(ks, sigma):
+    half_ks = (ks - 1) // 2
+    base_kernel = [0.] * half_ks + [1.] + [0.] * half_ks
+    kernel_window = gaussian_filter1d(
+        base_kernel, sigma=sigma) / max(gaussian_filter1d(base_kernel, sigma=sigma))
+    return kernel_window
+
+
+class SurpriseReweighting:
+    """
+    Custom reweighting Yann
+    """
+
+    def __init__(self, weights=None, nb_bins=100, alpha=1e-3):
+        if weights is None:
+            self.weights = [1.0, ] * nb_bins
+            self.weights = torch.tensor(self.weights)
+            self.weights = self.weights / torch.sum(self.weights)
+        else:
+            self.weights = weights
+        self.weights = self.weights.detach()
+        self.nb_bins = len(self.weights)
+        self.bin_width = 1.0 / self.nb_bins
+        self.alpha = alpha
+        logging.debug(
+            f"The SR distribution has {self.nb_bins} bins of width {self.bin_width}")
+        logging.debug(f"Initial self.weights: {self.weights}")
+
+    def update_and_get_weighted_loss(self, batch_labels, unweighted_loss):
+        device = batch_labels.device
+        if self.weights.device != device:
+            logging.debug(f"Moving SR weights to {device}")
+            self.weights = self.weights.to(device)
+        last_bin = 1.0 - self.bin_width
+        batch_idxs = torch.minimum(batch_labels, torch.ones_like(
+            batch_labels) * last_bin) / self.bin_width  # FIXME : double check
+        batch_idxs = batch_idxs.floor().long()
+        self.weights = self.weights.detach()  # ensure no gradients
+        weights = copy.deepcopy(self.weights[batch_idxs])
+        res = unweighted_loss * weights
+        with torch.no_grad():
+            abs_loss = torch.abs(unweighted_loss)
+
+            # compute the mean loss per idx
+
+            num = torch.zeros(self.nb_bins, device=device)
+            num = num.index_add(0, batch_idxs, abs_loss)
+            bincount = torch.bincount(batch_idxs, minlength=self.nb_bins)
+            div = bincount.float()
+            idx_unchanged = bincount == 0
+            idx_changed = bincount != 0
+            div[idx_unchanged] = 1.0
+            mean_loss_per_idx_normalized = num / div
+            sum_changed_weights = torch.sum(self.weights[idx_changed])
+            sum_mean_loss = torch.sum(
+                mean_loss_per_idx_normalized[idx_changed])
+            mean_loss_per_idx_normalized[idx_changed] = mean_loss_per_idx_normalized[idx_changed] * \
+                sum_changed_weights / sum_mean_loss
+            # logging.debug(f"old self.weights: {self.weights}")
+            self.weights[idx_changed] = (1.0 - self.alpha) * self.weights[idx_changed] + \
+                self.alpha * mean_loss_per_idx_normalized[idx_changed]
+            self.weights /= torch.sum(self.weights)  # force sum to 1
+            # logging.debug(f"unique_idx: {unique_idx}")
+            # logging.debug(f"new self.weights: {self.weights}")
+            # logging.debug(f"new torch.sum(self.weights): {torch.sum(self.weights)}")
+        return torch.sqrt(res * self.nb_bins)
+
+    def __str__(self):
+        return f"LDS nb_bins: {self.nb_bins}\nweights: {self.weights}"
diff --git a/portiloop_software/portiloop_python/ANN/portiloop_detector_training.py b/portiloop_software/portiloop_python/ANN/portiloop_detector_training.py
deleted file mode 100644
index 082520a..0000000
--- a/portiloop_software/portiloop_python/ANN/portiloop_detector_training.py
+++ /dev/null
@@ -1,1433 +0,0 @@
-"""
-Main script for training an ANN.
-"""
-
-# all imports
-
-import copy
-import logging
-import os
-import time
-from argparse import ArgumentParser
-from pathlib import Path
-from random import randint, seed
-
-import numpy as np
-import pandas as pd
-import torch
-import torch.nn as nn
-import torch.optim as optim
-from sklearn.model_selection import train_test_split
-from torch.nn import functional as F
-from torch.utils.data import Dataset, DataLoader
-from torch.utils.data.sampler import Sampler
-
-import wandb
-
-from scipy.ndimage import gaussian_filter1d, convolve1d
-
-from portiloop_software.portiloop_python.Utils.utils import out_dim
-
-path_dataset = Path(__file__).absolute().parent.parent.parent / 'dataset'
-recall_validation_factor = 0.5
-precision_validation_factor = 0.5
-
-# hyperparameters
-
-# batch_size_list = [64, 64, 64, 128, 128, 128, 256, 256, 256]
-# lr_adam_list = [0.0003, 0.0005, 0.0009]
-# hidden_size_list = [2, 5, 10, 15, 20]
-
-LEN_SEGMENT = 115  # in seconds
-
-
-# all classes and functions:
-
-class SignalDataset(Dataset):
-    def __init__(self, filename, path, window_size, fe, seq_len, seq_stride, list_subject, len_segment):
-        self.fe = fe
-        self.window_size = window_size
-        self.path_file = Path(path) / filename
-
-        self.data = pd.read_csv(self.path_file, header=None).to_numpy()
-        assert list_subject is not None
-        used_sequence = np.hstack([range(int(s[1]), int(s[2])) for s in list_subject])
-        split_data = np.array(np.split(self.data, int(len(self.data) / (len_segment + 30 * fe))))  # 115+30 = nb seconds per sequence in the dataset
-        split_data = split_data[used_sequence]
-        self.data = np.transpose(split_data.reshape((split_data.shape[0] * split_data.shape[1], 4)))
-
-        assert self.window_size <= len(self.data[0]), "Dataset smaller than window size."
-        self.full_signal = torch.tensor(self.data[0], dtype=torch.float)
-        self.full_envelope = torch.tensor(self.data[1], dtype=torch.float)
-        self.seq_len = seq_len  # 1 means single sample / no sequence ?
-        self.idx_stride = seq_stride
-        self.past_signal_len = self.seq_len * self.idx_stride
-
-        # list of indices that can be sampled:
-        self.indices = [idx for idx in range(len(self.data[0]) - self.window_size)  # all possible idxs in the dataset
-                        if not (self.data[3][idx + self.window_size - 1] < 0  # that are not ending in an unlabeled zone
-                                or idx < self.past_signal_len)]  # and far enough from the beginning to build a sequence up to here
-        total_spindles = np.sum(self.data[3] > THRESHOLD)
-        logging.debug(f"total number of spindles in this dataset : {total_spindles}")
-
-    def __len__(self):
-        return len(self.indices)
-
-    def __getitem__(self, idx):
-        assert 0 <= idx < len(self), f"Index out of range ({idx}/{len(self)})."
-        idx = self.indices[idx]
-        assert self.data[3][idx + self.window_size - 1] >= 0, f"Bad index: {idx}."
-
-        signal_seq = self.full_signal[idx - (self.past_signal_len - self.idx_stride):idx + self.window_size].unfold(0, self.window_size, self.idx_stride)
-        envelope_seq = self.full_envelope[idx - (self.past_signal_len - self.idx_stride):idx + self.window_size].unfold(0, self.window_size, self.idx_stride)
-
-        ratio_pf = torch.tensor(self.data[2][idx + self.window_size - 1], dtype=torch.float)
-        label = torch.tensor(self.data[3][idx + self.window_size - 1], dtype=torch.float)
-
-        return signal_seq, envelope_seq, ratio_pf, label
-
-    def is_spindle(self, idx):
-        assert 0 <= idx <= len(self), f"Index out of range ({idx}/{len(self)})."
-        idx = self.indices[idx]
-        return True if (self.data[3][idx + self.window_size - 1] > THRESHOLD) else False
-
-
-class UnlabelledSignalDatasetSingleSegment(Dataset):
-    """
-    Caution: this dataset does not sample sequences, but single windows
-    """
-    def __init__(self, unlabelled_segment, window_size):
-        self.window_size = window_size
-        self.full_signal = torch.tensor(unlabelled_segment, dtype=torch.float).squeeze()
-        assert len(self.full_signal.shape) == 1, f"Segment has more than one dimension: {self.full_signal.shape}"
-        assert self.window_size <= len(self.full_signal), "Segment smaller than window size."
-        self.seq_len = 1  # 1 means single sample / no sequence ?
-        self.idx_stride = 1
-        self.past_signal_len = self.seq_len * self.idx_stride
-
-        # list of indices that can be sampled:
-        self.indices = [idx for idx in range(len(self.full_signal) - self.window_size)  # all possible idxs in the dataset
-                        if (not idx < self.past_signal_len)]  # far enough from the beginning to build a sequence up to here
-
-    def __len__(self):
-        return len(self.indices)
-
-    def __getitem__(self, idx):
-        assert 0 <= idx < len(self), f"Index out of range ({idx}/{len(self)})."
-        idx = self.indices[idx]
-        signal_seq = self.full_signal[idx:idx + self.window_size].unfold(0, self.window_size, 1)
-        true_idx = idx + self.window_size
-        return signal_seq, true_idx
-
-
-def get_class_idxs(dataset, distribution_mode):
-    """
-    Directly outputs idx_true and idx_false arrays
-    """
-    length_dataset = len(dataset)
-
-    nb_true = 0
-    nb_false = 0
-
-    idx_true = []
-    idx_false = []
-
-    for i in range(length_dataset):
-        is_spindle = dataset.is_spindle(i)
-        if is_spindle or distribution_mode == 1:
-            nb_true += 1
-            idx_true.append(i)
-        else:
-            nb_false += 1
-            idx_false.append(i)
-
-    assert len(dataset) == nb_true + nb_false, f"Bad length dataset"
-
-    return np.array(idx_true), np.array(idx_false)
-
-
-# Sampler avec liste et sans rand liste
-
-class RandomSampler(Sampler):
-    """
-    Samples elements randomly and evenly between the two classes.
-    The sampling happens WITH replacement.
-    __iter__ stops after an arbitrary number of iterations = batch_size_list * nb_batch
-    Arguments:
-      idx_true: np.array
-      idx_false: np.array
-      batch_size (int)
-      nb_batch (int, optional): number of iteration before end of __iter__(), this defaults to len(data_source)
-    """
-
-    def __init__(self, idx_true, idx_false, batch_size, distribution_mode, nb_batch):
-        self.idx_true = idx_true
-        self.idx_false = idx_false
-        self.nb_true = self.idx_true.size
-        self.nb_false = self.idx_false.size
-        self.length = nb_batch * batch_size
-        self.distribution_mode = distribution_mode
-
-    def __iter__(self):
-        global precision_validation_factor
-        global recall_validation_factor
-        cur_iter = 0
-        seed()
-        # epsilon = 1e-7 proba = float(0.5 + 0.5 * (precision_validation_factor - recall_validation_factor) / (precision_validation_factor +
-        # recall_validation_factor + epsilon))
-        proba = 0.5
-        if self.distribution_mode == 1:
-            proba = 1
-        logging.debug(f"proba: {proba}")
-
-        while cur_iter < self.length:
-            cur_iter += 1
-            sample_class = np.random.choice([0, 1], p=[1 - proba, proba])
-            if sample_class:  # sample true
-                idx_file = randint(0, self.nb_true - 1)
-                idx_res = self.idx_true[idx_file]
-            else:  # sample false
-                idx_file = randint(0, self.nb_false - 1)
-                idx_res = self.idx_false[idx_file]
-
-            yield idx_res
-
-    def __len__(self):
-        return self.length
-
-
-# Sampler validation
-
-class ValidationSampler(Sampler):
-    """
-    network_stride (int >= 1, default: 1): divides the size of the dataset (and of the batch) by striding further than 1
-    """
-
-    def __init__(self, data_source, seq_stride, nb_segment, len_segment, network_stride):
-        network_stride = int(network_stride)
-        assert network_stride >= 1
-        self.network_stride = network_stride
-        self.seq_stride = seq_stride
-        self.data = data_source
-        self.nb_segment = nb_segment
-        self.len_segment = len_segment
-
-    def __iter__(self):
-        seed()
-        batches_per_segment = self.len_segment // self.seq_stride  # len sequence = 115 s + add the 15 first s?
-        cursor_batch = 0
-        while cursor_batch < batches_per_segment:
-            for i in range(self.nb_segment):
-                for j in range(0, (self.seq_stride // self.network_stride) * self.network_stride, self.network_stride):
-                    cur_idx = i * self.len_segment + j + cursor_batch * self.seq_stride
-                    # print(f"i:{i}, j:{j}, self.len_segment:{self.len_segment}, cursor_batch:{cursor_batch}, self.seq_stride:{self.seq_stride}, cur_idx:{cur_idx}")
-                    yield cur_idx
-            cursor_batch += 1
-
-    def __len__(self):
-        assert False
-        # return len(self.data)
-        # return len(self.data_source)
-
-
-class ConvPoolModule(nn.Module):
-    def __init__(self,
-                 in_channels,
-                 out_channel,
-                 kernel_conv,
-                 stride_conv,
-                 conv_padding,
-                 dilation_conv,
-                 kernel_pool,
-                 stride_pool,
-                 pool_padding,
-                 dilation_pool,
-                 dropout_p):
-        super(ConvPoolModule, self).__init__()
-
-        self.conv = nn.Conv1d(in_channels=in_channels,
-                              out_channels=out_channel,
-                              kernel_size=kernel_conv,
-                              stride=stride_conv,
-                              padding=conv_padding,
-                              dilation=dilation_conv)
-        self.pool = nn.MaxPool1d(kernel_size=kernel_pool,
-                                 stride=stride_pool,
-                                 padding=pool_padding,
-                                 dilation=dilation_pool)
-        self.dropout = nn.Dropout(dropout_p)
-
-    def forward(self, input_f):
-        x, max_value = input_f
-        x = F.relu(self.conv(x))
-        x = self.pool(x)
-        max_temp = torch.max(abs(x))
-        if max_temp > max_value:
-            logging.debug(f"max_value = {max_temp}")
-            max_value = max_temp
-        return self.dropout(x), max_value
-
-
-class FcModule(nn.Module):
-    def __init__(self,
-                 in_features,
-                 out_features,
-                 dropout_p):
-        super(FcModule, self).__init__()
-
-        self.fc = nn.Linear(in_features=in_features, out_features=out_features)
-        self.dropout = nn.Dropout(dropout_p)
-
-    def forward(self, x):
-        x = F.relu(self.fc(x))
-        return self.dropout(x)
-
-
-class PortiloopNetwork(nn.Module):
-    def __init__(self, c_dict):
-        super(PortiloopNetwork, self).__init__()
-
-        RNN = c_dict["RNN"]
-        stride_pool = c_dict["stride_pool"]
-        stride_conv = c_dict["stride_conv"]
-        kernel_conv = c_dict["kernel_conv"]
-        kernel_pool = c_dict["kernel_pool"]
-        nb_channel = c_dict["nb_channel"]
-        hidden_size = c_dict["hidden_size"]
-        window_size_s = c_dict["window_size_s"]
-        dropout_p = c_dict["dropout"]
-        dilation_conv = c_dict["dilation_conv"]
-        dilation_pool = c_dict["dilation_pool"]
-        fe = c_dict["fe"]
-        nb_conv_layers = c_dict["nb_conv_layers"]
-        nb_rnn_layers = c_dict["nb_rnn_layers"]
-        first_layer_dropout = c_dict["first_layer_dropout"]
-        self.envelope_input = c_dict["envelope_input"]
-        self.power_features_input = c_dict["power_features_input"]
-        self.classification = c_dict["classification"]
-
-        conv_padding = 0  # int(kernel_conv // 2)
-        pool_padding = 0  # int(kernel_pool // 2)
-        window_size = int(window_size_s * fe)
-        nb_out = window_size
-
-        for _ in range(nb_conv_layers):
-            nb_out = out_dim(nb_out, conv_padding, dilation_conv, kernel_conv, stride_conv)
-            nb_out = out_dim(nb_out, pool_padding, dilation_pool, kernel_pool, stride_pool)
-
-        output_cnn_size = int(nb_channel * nb_out)
-
-        self.RNN = RNN
-        self.first_layer_input1 = ConvPoolModule(in_channels=1,
-                                                 out_channel=nb_channel,
-                                                 kernel_conv=kernel_conv,
-                                                 stride_conv=stride_conv,
-                                                 conv_padding=conv_padding,
-                                                 dilation_conv=dilation_conv,
-                                                 kernel_pool=kernel_pool,
-                                                 stride_pool=stride_pool,
-                                                 pool_padding=pool_padding,
-                                                 dilation_pool=dilation_pool,
-                                                 dropout_p=dropout_p if first_layer_dropout else 0)
-        self.seq_input1 = nn.Sequential(*(ConvPoolModule(in_channels=nb_channel,
-                                                         out_channel=nb_channel,
-                                                         kernel_conv=kernel_conv,
-                                                         stride_conv=stride_conv,
-                                                         conv_padding=conv_padding,
-                                                         dilation_conv=dilation_conv,
-                                                         kernel_pool=kernel_pool,
-                                                         stride_pool=stride_pool,
-                                                         pool_padding=pool_padding,
-                                                         dilation_pool=dilation_pool,
-                                                         dropout_p=dropout_p) for _ in range(nb_conv_layers - 1)))
-        if RNN:
-            self.gru_input1 = nn.GRU(input_size=output_cnn_size,
-                                     hidden_size=hidden_size,
-                                     num_layers=nb_rnn_layers,
-                                     dropout=0,
-                                     batch_first=True)
-        #       fc_size = hidden_size
-        else:
-            self.first_fc_input1 = FcModule(in_features=output_cnn_size, out_features=hidden_size, dropout_p=dropout_p)
-            self.seq_fc_input1 = nn.Sequential(
-                *(FcModule(in_features=hidden_size, out_features=hidden_size, dropout_p=dropout_p) for _ in range(nb_rnn_layers - 1)))
-        if self.envelope_input:
-            self.first_layer_input2 = ConvPoolModule(in_channels=1,
-                                                     out_channel=nb_channel,
-                                                     kernel_conv=kernel_conv,
-                                                     stride_conv=stride_conv,
-                                                     conv_padding=conv_padding,
-                                                     dilation_conv=dilation_conv,
-                                                     kernel_pool=kernel_pool,
-                                                     stride_pool=stride_pool,
-                                                     pool_padding=pool_padding,
-                                                     dilation_pool=dilation_pool,
-                                                     dropout_p=dropout_p if first_layer_dropout else 0)
-            self.seq_input2 = nn.Sequential(*(ConvPoolModule(in_channels=nb_channel,
-                                                             out_channel=nb_channel,
-                                                             kernel_conv=kernel_conv,
-                                                             stride_conv=stride_conv,
-                                                             conv_padding=conv_padding,
-                                                             dilation_conv=dilation_conv,
-                                                             kernel_pool=kernel_pool,
-                                                             stride_pool=stride_pool,
-                                                             pool_padding=pool_padding,
-                                                             dilation_pool=dilation_pool,
-                                                             dropout_p=dropout_p) for _ in range(nb_conv_layers - 1)))
-
-            if RNN:
-                self.gru_input2 = nn.GRU(input_size=output_cnn_size,
-                                         hidden_size=hidden_size,
-                                         num_layers=nb_rnn_layers,
-                                         dropout=0,
-                                         batch_first=True)
-            else:
-                self.first_fc_input2 = FcModule(in_features=output_cnn_size, out_features=hidden_size, dropout_p=dropout_p)
-                self.seq_fc_input2 = nn.Sequential(
-                    *(FcModule(in_features=hidden_size, out_features=hidden_size, dropout_p=dropout_p) for _ in range(nb_rnn_layers - 1)))
-        fc_features = 0
-        fc_features += hidden_size
-        if self.envelope_input:
-            fc_features += hidden_size
-        if self.power_features_input:
-            fc_features += 1
-        out_features = 1
-        self.fc = nn.Linear(in_features=fc_features,  # enveloppe and signal + power features ratio
-                            out_features=out_features)  # probability of being a spindle
-
-    def forward(self, x1, x2, x3, h1, h2, max_value=np.inf):
-        # x1 : input 1 : cleaned signal
-        # x2 : input 2 : envelope
-        # x3 : power features ratio
-        # h1 : gru 1 hidden size
-        # h2 : gru 2 hidden size
-        # max_value (optional) : print the maximal value reach during inference (used to verify if the FPGA implementation precision is enough)
-        (batch_size, sequence_len, features) = x1.shape
-
-        if ABLATION == 1:
-            x1 = copy.deepcopy(x2)
-        elif ABLATION == 2:
-            x2 = copy.deepcopy(x1)
-
-        x1 = x1.view(-1, 1, features)
-        x1, max_value = self.first_layer_input1((x1, max_value))
-        x1, max_value = self.seq_input1((x1, max_value))
-
-        x1 = torch.flatten(x1, start_dim=1, end_dim=-1)
-        hn1 = None
-        if self.RNN:
-            x1 = x1.view(batch_size, sequence_len, -1)
-            x1, hn1 = self.gru_input1(x1, h1)
-            max_temp = torch.max(abs(x1))
-            if max_temp > max_value:
-                logging.debug(f"max_value = {max_temp}")
-                max_value = max_temp
-            x1 = x1[:, -1, :]
-        else:
-            x1 = self.first_fc_input1(x1)
-            x1 = self.seq_fc_input1(x1)
-        x = x1
-        hn2 = None
-        if self.envelope_input:
-            x2 = x2.view(-1, 1, features)
-            x2, max_value = self.first_layer_input2((x2, max_value))
-            x2, max_value = self.seq_input2((x2, max_value))
-
-            x2 = torch.flatten(x2, start_dim=1, end_dim=-1)
-            if self.RNN:
-                x2 = x2.view(batch_size, sequence_len, -1)
-                x2, hn2 = self.gru_input2(x2, h2)
-                max_temp = torch.max(abs(x2))
-                if max_temp > max_value:
-                    logging.debug(f"max_value = {max_temp}")
-                    max_value = max_temp
-                x2 = x2[:, -1, :]
-            else:
-                x2 = self.first_fc_input2(x2)
-                x2 = self.seq_fc_input2(x2)
-            x = torch.cat((x, x2), -1)
-
-        if self.power_features_input:
-            x3 = x3.view(-1, 1)
-            x = torch.cat((x, x3), -1)
-
-        x = self.fc(x)  # output size: 1
-        max_temp = torch.max(abs(x))
-        if max_temp > max_value:
-            logging.debug(f"max_value = {max_temp}")
-            max_value = max_temp
-        x = torch.sigmoid(x)
-
-        return x, hn1, hn2, max_value
-
-
-class LoggerWandb:
-    def __init__(self, experiment_name, c_dict, project_name):
-        self.best_model = None
-        self.experiment_name = experiment_name
-        os.environ['WANDB_API_KEY'] = "cd105554ccdfeee0bbe69c175ba0c14ed41f6e00"
-        self.wandb_run = wandb.init(project=project_name, entity="portiloop", id=experiment_name, resume="allow",
-                                    config=c_dict, reinit=True)
-
-    def log(self,
-            accuracy_train,
-            loss_train,
-            accuracy_validation,
-            loss_validation,
-            f1_validation,
-            precision_validation,
-            recall_validation,
-            best_epoch,
-            best_model,
-            loss_early_stopping,
-            best_epoch_early_stopping,
-            best_model_accuracy_validation,
-            best_model_f1_score_validation,
-            best_model_precision_validation,
-            best_model_recall_validation,
-            best_model_loss_validation,
-            best_model_on_loss_accuracy_validation,
-            best_model_on_loss_f1_score_validation,
-            best_model_on_loss_precision_validation,
-            best_model_on_loss_recall_validation,
-            best_model_on_loss_loss_validation,
-            updated_model=False,
-            ):
-        self.best_model = best_model
-        self.wandb_run.log({
-            "accuracy_train": accuracy_train,
-            "loss_train": loss_train,
-            "accuracy_validation": accuracy_validation,
-            "loss_validation": loss_validation,
-            "f1_validation": f1_validation,
-            "precision_validation": precision_validation,
-            "recall_validation": recall_validation,
-            "loss_early_stopping": loss_early_stopping,
-        })
-        self.wandb_run.summary["best_epoch"] = best_epoch
-        self.wandb_run.summary["best_epoch_early_stopping"] = best_epoch_early_stopping
-        self.wandb_run.summary["best_model_f1_score_validation"] = best_model_f1_score_validation
-        self.wandb_run.summary["best_model_precision_validation"] = best_model_precision_validation
-        self.wandb_run.summary["best_model_recall_validation"] = best_model_recall_validation
-        self.wandb_run.summary["best_model_loss_validation"] = best_model_loss_validation
-        self.wandb_run.summary["best_model_accuracy_validation"] = best_model_accuracy_validation
-        self.wandb_run.summary["best_model_on_loss_f1_score_validation"] = best_model_on_loss_f1_score_validation
-        self.wandb_run.summary["best_model_on_loss_precision_validation"] = best_model_on_loss_precision_validation
-        self.wandb_run.summary["best_model_on_loss_recall_validation"] = best_model_on_loss_recall_validation
-        self.wandb_run.summary["best_model_on_loss_loss_validation"] = best_model_on_loss_loss_validation
-        self.wandb_run.summary["best_model_on_loss_accuracy_validation"] = best_model_on_loss_accuracy_validation
-        if updated_model:
-            self.wandb_run.save(os.path.join(path_dataset, self.experiment_name), policy="live", base_path=path_dataset)
-            self.wandb_run.save(os.path.join(path_dataset, self.experiment_name + "_on_loss"), policy="live", base_path=path_dataset)
-
-    def __del__(self):
-        self.wandb_run.finish()
-
-    def restore(self, classif):
-        if classif:
-            self.wandb_run.restore(self.experiment_name, root=path_dataset)
-        else:
-            self.wandb_run.restore(self.experiment_name + "_on_loss", root=path_dataset)
-
-
-def f1_loss(output, batch_labels):
-    # logging.debug(f"output in loss : {output[:,1]}")
-    # logging.debug(f"batch_labels in loss : {batch_labels}")
-    y_pred = output
-    tp = (batch_labels * y_pred).sum().to(torch.float32)
-    tn = ((1 - batch_labels) * (1 - y_pred)).sum().to(torch.float32).item()
-    fp = ((1 - batch_labels) * y_pred).sum().to(torch.float32)
-    fn = (batch_labels * (1 - y_pred)).sum().to(torch.float32)
-
-    epsilon = 1e-7
-    F1_class1 = 2 * tp / (2 * tp + fp + fn + epsilon)
-    F1_class0 = 2 * tn / (2 * tn + fn + fp + epsilon)
-    New_F1 = (F1_class1 + F1_class0) / 2
-    return 1 - New_F1
-
-
-def run_inference(dataloader, criterion, net, device, hidden_size, nb_rnn_layers, classification, batch_size_validation, max_value=np.inf):
-    net_copy = copy.deepcopy(net)
-    net_copy = net_copy.to(device)
-    net_copy = net_copy.eval()
-    loss = 0
-    n = 0
-    batch_labels_total = torch.tensor([], device=device)
-    output_total = torch.tensor([], device=device)
-    h1 = torch.zeros((nb_rnn_layers, batch_size_validation, hidden_size), device=device)
-    h2 = torch.zeros((nb_rnn_layers, batch_size_validation, hidden_size), device=device)
-    with torch.no_grad():
-        for batch_data in dataloader:
-            batch_samples_input1, batch_samples_input2, batch_samples_input3, batch_labels = batch_data
-            batch_samples_input1 = batch_samples_input1.to(device=device).float()
-            batch_samples_input2 = batch_samples_input2.to(device=device).float()
-            batch_samples_input3 = batch_samples_input3.to(device=device).float()
-            batch_labels = batch_labels.to(device=device).float()
-            if classification:
-                batch_labels = (batch_labels > THRESHOLD)
-                batch_labels = batch_labels.float()
-            output, h1, h2, max_value = net_copy(batch_samples_input1, batch_samples_input2, batch_samples_input3, h1, h2, max_value)
-            # logging.debug(f"label = {batch_labels}")
-            # logging.debug(f"output = {output}")
-            output = output.view(-1)
-            loss_py = criterion(output, batch_labels).mean()
-            loss += loss_py.item()
-            # logging.debug(f"loss = {loss}")
-            if not classification:
-                output = (output > THRESHOLD)
-                batch_labels = (batch_labels > THRESHOLD)
-            else:
-                output = (output >= 0.5)
-            batch_labels_total = torch.cat([batch_labels_total, batch_labels])
-            output_total = torch.cat([output_total, output])
-            # logging.debug(f"batch_label_total : {batch_labels_total}")
-            # logging.debug(f"output_total : {output_total}")
-            n += 1
-
-    loss /= n
-    acc = (output_total == batch_labels_total).float().mean()
-    output_total = output_total.float()
-    batch_labels_total = batch_labels_total.float()
-    tp = (batch_labels_total * output_total)
-    tn = ((1 - batch_labels_total) * (1 - output_total))
-    fp = ((1 - batch_labels_total) * output_total)
-    fn = (batch_labels_total * (1 - output_total))
-    return output_total, batch_labels_total, loss, acc, tp, tn, fp, fn
-
-def run_inference_unlabelled_offline(dataloader, net, device, hidden_size, nb_rnn_layers, classification, batch_size_validation):
-    net_copy = copy.deepcopy(net)
-    net_copy = net_copy.to(device)
-    net_copy = net_copy.eval()
-    true_idx_total = torch.tensor([], device=device)
-    output_total = torch.tensor([], device=device)
-    h1 = torch.zeros((nb_rnn_layers, batch_size_validation, hidden_size), device=device)
-    h2 = torch.zeros((nb_rnn_layers, batch_size_validation, hidden_size), device=device)
-    max_value = np.inf
-    with torch.no_grad():
-        for batch_data in dataloader:
-            batch_samples_input1, batch_true_idx = batch_data
-            batch_samples_input1 = batch_samples_input1.to(device=device).float()
-            output, h1, h2, max_value = net_copy(batch_samples_input1, None, None, h1, h2, max_value)
-            output = output.view(-1)
-            # if not classification:
-            #     output = output  # (output > THRESHOLD)
-            # else:
-            #     output = (output >= 0.5)
-            true_idx_total = torch.cat([true_idx_total, batch_true_idx])
-            output_total = torch.cat([output_total, output])
-    output_total = output_total.float()
-    true_idx_total = true_idx_total.int()
-    return output_total, true_idx_total
-
-def get_metrics(tp, fp, fn):
-    tp_sum = tp.sum().to(torch.float32).item()
-    fp_sum = fp.sum().to(torch.float32).item()
-    fn_sum = fn.sum().to(torch.float32).item()
-    epsilon = 1e-7
-
-    precision = tp_sum / (tp_sum + fp_sum + epsilon)
-    recall = tp_sum / (tp_sum + fn_sum + epsilon)
-
-    f1 = 2 * (precision * recall) / (precision + recall + epsilon)
-
-    return f1, precision, recall
-
-
-# Regression balancing:
-
-
-def get_lds_kernel(ks, sigma):
-    half_ks = (ks - 1) // 2
-    base_kernel = [0.] * half_ks + [1.] + [0.] * half_ks
-    kernel_window = gaussian_filter1d(base_kernel, sigma=sigma) / max(gaussian_filter1d(base_kernel, sigma=sigma))
-    return kernel_window
-
-
-def generate_label_distribution_and_lds(dataset, kernel_size=5, kernel_std=2.0, nb_bins=100, reweight='inv_sqrt'):
-    """
-    Returns:
-        distribution: the distribution of labels in the dataset
-        lds: the same distribution, smoothed with a gaussian kernel
-    """
-
-    weights = torch.tensor([0.3252, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0069, 0.0163,
-                            0.0000, 0.0366, 0.0000, 0.0179, 0.0000, 0.0076, 0.0444, 0.0176, 0.0025,
-                            0.0056, 0.0000, 0.0416, 0.0039, 0.0000, 0.0000, 0.0000, 0.0171, 0.0000,
-                            0.0000, 0.0042, 0.0114, 0.0209, 0.0023, 0.0036, 0.0106, 0.0241, 0.0034,
-                            0.0000, 0.0056, 0.0000, 0.0029, 0.0241, 0.0076, 0.0027, 0.0012, 0.0000,
-                            0.0166, 0.0028, 0.0000, 0.0000, 0.0000, 0.0197, 0.0000, 0.0000, 0.0021,
-                            0.0054, 0.0191, 0.0014, 0.0023, 0.0074, 0.0000, 0.0186, 0.0000, 0.0088,
-                            0.0000, 0.0032, 0.0135, 0.0069, 0.0029, 0.0016, 0.0164, 0.0068, 0.0022,
-                            0.0000, 0.0000, 0.0000, 0.0191, 0.0000, 0.0000, 0.0017, 0.0082, 0.0181,
-                            0.0019, 0.0038, 0.0064, 0.0000, 0.0133, 0.0000, 0.0069, 0.0000, 0.0025,
-                            0.0186, 0.0076, 0.0031, 0.0016, 0.0218, 0.0105, 0.0049, 0.0000, 0.0000,
-                            0.0246], dtype=torch.float64)
-
-    lds = None
-    dist = None
-    bins = None
-    return weights, dist, lds, bins
-
-    # TODO: remove before
-
-    dataset_len = len(dataset)
-    logging.debug(f"Length of the dataset passed to generate_label_distribution_and_lds: {dataset_len}")
-    logging.debug(f"kernel_size: {kernel_size}")
-    logging.debug(f"kernel_std: {kernel_std}")
-    logging.debug(f"Generating empirical distribution...")
-
-    tab = np.array([dataset[i][3].item() for i in range(dataset_len)])
-    tab = np.around(tab, decimals=5)
-    elts = np.unique(tab)
-    logging.debug(f"all labels: {elts}")
-    dist, bins = np.histogram(tab, bins=nb_bins, density=False, range=(0.0, 1.0))
-
-    # dist, bins = np.histogram([dataset[i][3].item() for i in range(dataset_len)], bins=nb_bins, density=False, range=(0.0, 1.0))
-
-    logging.debug(f"dist: {dist}")
-
-    # kernel = get_lds_kernel(kernel_size, kernel_std)
-    # lds = convolve1d(dist, weights=kernel, mode='constant')
-
-    lds = gaussian_filter1d(input=dist, sigma=kernel_std, axis=- 1, order=0, output=None, mode='reflect', cval=0.0, truncate=4.0)
-
-    weights = np.sqrt(lds) if reweight == 'inv_sqrt' else lds
-    # scaling = len(weights) / np.sum(weights)  # not the same implementation as in the original repo
-    scaling = 1.0 / np.sum(weights)
-    weights = weights * scaling
-
-    return weights, dist, lds, bins
-
-
-class LabelDistributionSmoothing:
-    def __init__(self, c=1.0, dataset=None, weights=None, kernel_size=5, kernel_std=2.0, nb_bins=100, weighting_mode="inv_sqrt"):
-        """
-        If provided, lds_distribution must be a numpy.array representing a density over [0.0, 1.0] (e.g. first element of a numpy.histogram)
-        When lds_distribution is provided, it overrides everything else
-        c is the scaling constant for lds weights
-        weighting_mode can be 'inv' or 'inv_sqrt'
-        """
-        assert dataset is not None or weights is not None, "Either a dataset or weights must be provided"
-        self.distribution = None
-        self.bins = None
-        self.lds_distribution = None
-        if weights is None:
-            self.weights, self.distribution, self.lds_distribution, self.bins = generate_label_distribution_and_lds(dataset, kernel_size, kernel_std,
-                                                                                                                    nb_bins, weighting_mode)
-            logging.debug(f"self.distribution: {self.weights}")
-            logging.debug(f"self.lds_distribution: {self.weights}")
-        else:
-            self.weights = weights
-        self.nb_bins = len(self.weights)
-        self.bin_width = 1.0 / self.nb_bins
-        self.c = c
-        logging.debug(f"The LDS distribution has {self.nb_bins} bins of width {self.bin_width}")
-        self.weights = torch.tensor(self.weights)
-
-        logging.debug(f"self.weights: {self.weights}")
-
-    def lds_weights_batch(self, batch_labels):
-        device = batch_labels.device
-        if self.weights.device != device:
-            self.weights = self.weights.to(device)
-        last_bin = 1.0 - self.bin_width
-        batch_idxs = torch.minimum(batch_labels, torch.ones_like(batch_labels) * last_bin) / self.bin_width  # FIXME : double check
-        batch_idxs = batch_idxs.floor().long()
-        res = 1.0 / self.weights[batch_idxs]
-        return res
-
-    def __str__(self):
-        return f"LDS nb_bins: {self.nb_bins}\nbins: {self.bins}\ndistribution: {self.distribution}\nlds_distribution: {self.lds_distribution}\nweights: {self.weights} "
-
-
-class SurpriseReweighting:
-    """
-    Custom reweighting Yann
-    """
-
-    def __init__(self, weights=None, nb_bins=100, alpha=1e-3):
-        if weights is None:
-            self.weights = [1.0, ] * nb_bins
-            self.weights = torch.tensor(self.weights)
-            self.weights = self.weights / torch.sum(self.weights)
-        else:
-            self.weights = weights
-        self.weights = self.weights.detach()
-        self.nb_bins = len(self.weights)
-        self.bin_width = 1.0 / self.nb_bins
-        self.alpha = alpha
-        logging.debug(f"The SR distribution has {self.nb_bins} bins of width {self.bin_width}")
-        logging.debug(f"Initial self.weights: {self.weights}")
-
-    def update_and_get_weighted_loss(self, batch_labels, unweighted_loss):
-        device = batch_labels.device
-        if self.weights.device != device:
-            logging.debug(f"Moving SR weights to {device}")
-            self.weights = self.weights.to(device)
-        last_bin = 1.0 - self.bin_width
-        batch_idxs = torch.minimum(batch_labels, torch.ones_like(batch_labels) * last_bin) / self.bin_width  # FIXME : double check
-        batch_idxs = batch_idxs.floor().long()
-        self.weights = self.weights.detach()  # ensure no gradients
-        weights = copy.deepcopy(self.weights[batch_idxs])
-        res = unweighted_loss * weights
-        with torch.no_grad():
-            abs_loss = torch.abs(unweighted_loss)
-
-            # compute the mean loss per idx
-
-            num = torch.zeros(self.nb_bins, device=device)
-            num = num.index_add(0, batch_idxs, abs_loss)
-            bincount = torch.bincount(batch_idxs, minlength=self.nb_bins)
-            div = bincount.float()
-            idx_unchanged = bincount == 0
-            idx_changed = bincount != 0
-            div[idx_unchanged] = 1.0
-            mean_loss_per_idx_normalized = num / div
-            sum_changed_weights = torch.sum(self.weights[idx_changed])
-            sum_mean_loss = torch.sum(mean_loss_per_idx_normalized[idx_changed])
-            mean_loss_per_idx_normalized[idx_changed] = mean_loss_per_idx_normalized[idx_changed] * sum_changed_weights / sum_mean_loss
-            # logging.debug(f"old self.weights: {self.weights}")
-            self.weights[idx_changed] = (1.0 - self.alpha) * self.weights[idx_changed] + self.alpha * mean_loss_per_idx_normalized[idx_changed]
-            self.weights /= torch.sum(self.weights)  # force sum to 1
-            # logging.debug(f"unique_idx: {unique_idx}")
-            # logging.debug(f"new self.weights: {self.weights}")
-            # logging.debug(f"new torch.sum(self.weights): {torch.sum(self.weights)}")
-        return torch.sqrt(res * self.nb_bins)
-
-    def __str__(self):
-        return f"LDS nb_bins: {self.nb_bins}\nweights: {self.weights}"
-
-
-# run:
-
-def generate_dataloader(window_size, fe, seq_len, seq_stride, distribution_mode, batch_size, nb_batch_per_epoch, classification, split_i,
-                        network_stride):
-    all_subject = pd.read_csv(Path(path_dataset) / subject_list, header=None, delim_whitespace=True).to_numpy()
-    test_subject = None
-    if PHASE == 'full':
-        p1_subject = pd.read_csv(Path(path_dataset) / subject_list_p1, header=None, delim_whitespace=True).to_numpy()
-        p2_subject = pd.read_csv(Path(path_dataset) / subject_list_p2, header=None, delim_whitespace=True).to_numpy()
-        train_subject_p1, validation_subject_p1 = train_test_split(p1_subject, train_size=0.8, random_state=split_i)
-        if TEST_SET:
-            test_subject_p1, validation_subject_p1 = train_test_split(validation_subject_p1, train_size=0.5, random_state=split_i)
-        train_subject_p2, validation_subject_p2 = train_test_split(p2_subject, train_size=0.8, random_state=split_i)
-        if TEST_SET:
-            test_subject_p2, validation_subject_p2 = train_test_split(validation_subject_p2, train_size=0.5, random_state=split_i)
-        train_subject = np.array([s for s in all_subject if s[0] in train_subject_p1[:, 0] or s[0] in train_subject_p2[:, 0]]).squeeze()
-        if TEST_SET:
-            test_subject = np.array([s for s in all_subject if s[0] in test_subject_p1[:, 0] or s[0] in test_subject_p2[:, 0]]).squeeze()
-        validation_subject = np.array(
-            [s for s in all_subject if s[0] in validation_subject_p1[:, 0] or s[0] in validation_subject_p2[:, 0]]).squeeze()
-    else:
-        train_subject, validation_subject = train_test_split(all_subject, train_size=0.8, random_state=split_i)
-        if TEST_SET:
-            test_subject, validation_subject = train_test_split(validation_subject, train_size=0.5, random_state=split_i)
-    logging.debug(f"Subjects in training : {train_subject[:, 0]}")
-    logging.debug(f"Subjects in validation : {validation_subject[:, 0]}")
-    if TEST_SET:
-        logging.debug(f"Subjects in test : {test_subject[:, 0]}")
-
-    len_segment = LEN_SEGMENT * fe
-    train_loader = None
-    validation_loader = None
-    test_loader = None
-    batch_size_validation = None
-    batch_size_test = None
-    filename = filename_classification_dataset if classification else filename_regression_dataset
-
-    if seq_len is not None:
-        nb_segment_validation = len(np.hstack([range(int(s[1]), int(s[2])) for s in validation_subject]))
-        batch_size_validation = len(list(range(0, (seq_stride // network_stride) * network_stride, network_stride))) * nb_segment_validation
-
-        ds_train = SignalDataset(filename=filename,
-                                 path=path_dataset,
-                                 window_size=window_size,
-                                 fe=fe,
-                                 seq_len=seq_len,
-                                 seq_stride=seq_stride,
-                                 list_subject=train_subject,
-                                 len_segment=len_segment)
-
-        ds_validation = SignalDataset(filename=filename,
-                                      path=path_dataset,
-                                      window_size=window_size,
-                                      fe=fe,
-                                      seq_len=1,
-                                      seq_stride=1,  # just to be sure, fixed value
-                                      list_subject=validation_subject,
-                                      len_segment=len_segment)
-        idx_true, idx_false = get_class_idxs(ds_train, distribution_mode)
-        samp_train = RandomSampler(idx_true=idx_true,
-                                   idx_false=idx_false,
-                                   batch_size=batch_size,
-                                   nb_batch=nb_batch_per_epoch,
-                                   distribution_mode=distribution_mode)
-
-        samp_validation = ValidationSampler(ds_validation,
-                                            seq_stride=seq_stride,
-                                            len_segment=len_segment,
-                                            nb_segment=nb_segment_validation,
-                                            network_stride=network_stride)
-        train_loader = DataLoader(ds_train,
-                                  batch_size=batch_size,
-                                  sampler=samp_train,
-                                  shuffle=False,
-                                  num_workers=0,
-                                  pin_memory=True)
-
-        validation_loader = DataLoader(ds_validation,
-                                       batch_size=batch_size_validation,
-                                       sampler=samp_validation,
-                                       num_workers=0,
-                                       pin_memory=True,
-                                       shuffle=False)
-    else:
-        nb_segment_test = len(np.hstack([range(int(s[1]), int(s[2])) for s in test_subject]))
-        batch_size_test = len(list(range(0, (seq_stride // network_stride) * network_stride, network_stride))) * nb_segment_test
-
-        ds_test = SignalDataset(filename=filename,
-                                path=path_dataset,
-                                window_size=window_size,
-                                fe=fe,
-                                seq_len=1,
-                                seq_stride=1,  # just to be sure, fixed value
-                                list_subject=test_subject,
-                                len_segment=len_segment)
-
-        samp_test = ValidationSampler(ds_test,
-                                      seq_stride=seq_stride,
-                                      len_segment=len_segment,
-                                      nb_segment=nb_segment_test,
-                                      network_stride=network_stride)
-
-        test_loader = DataLoader(ds_test,
-                                 batch_size=batch_size_test,
-                                 sampler=samp_test,
-                                 num_workers=0,
-                                 pin_memory=True,
-                                 shuffle=False)
-
-    return train_loader, validation_loader, batch_size_validation, test_loader, batch_size_test, test_subject
-
-def generate_dataloader_unlabelled_offline(unlabelled_segment,
-                                           window_size,
-                                           seq_stride,
-                                           network_stride):
-    nb_segment_test = 1
-    batch_size_test = len(list(range(0, (seq_stride // network_stride) * network_stride, network_stride))) * nb_segment_test
-    unlabelled_segment = torch.tensor(unlabelled_segment, dtype=torch.float).squeeze()
-    assert len(unlabelled_segment.shape) == 1, f"Segment has more than one dimension: {unlabelled_segment.shape}"
-    len_segment = len(unlabelled_segment)
-    ds_test = UnlabelledSignalDatasetSingleSegment(unlabelled_segment=unlabelled_segment,
-                                                   window_size=window_size)
-    samp_test = ValidationSampler(ds_test,
-                                  seq_stride=seq_stride,
-                                  len_segment=len_segment-window_size,  # because we don't have additional data at the end on the signal here
-                                  nb_segment=nb_segment_test,
-                                  network_stride=network_stride)
-
-    test_loader = DataLoader(ds_test,
-                             batch_size=batch_size_test,
-                             sampler=samp_test,
-                             num_workers=0,
-                             pin_memory=True,
-                             shuffle=False)
-
-    return test_loader, batch_size_test
-
-def run(config_dict, wandb_project, save_model, unique_name):
-    global precision_validation_factor
-    global recall_validation_factor
-    _t_start = time.time()
-    logging.debug(f"config_dict: {config_dict}")
-    experiment_name = f"{config_dict['experiment_name']}_{time.time_ns()}" if unique_name else config_dict['experiment_name']
-    nb_epoch_max = config_dict["nb_epoch_max"]
-    nb_batch_per_epoch = config_dict["nb_batch_per_epoch"]
-    nb_epoch_early_stopping_stop = config_dict["nb_epoch_early_stopping_stop"]
-    early_stopping_smoothing_factor = config_dict["early_stopping_smoothing_factor"]
-    batch_size = config_dict["batch_size"]
-    seq_len = config_dict["seq_len"]
-    window_size_s = config_dict["window_size_s"]
-    fe = config_dict["fe"]
-    seq_stride_s = config_dict["seq_stride_s"]
-    lr_adam = config_dict["lr_adam"]
-    hidden_size = config_dict["hidden_size"]
-    device_val = config_dict["device_val"]
-    device_train = config_dict["device_train"]
-    max_duration = config_dict["max_duration"]
-    nb_rnn_layers = config_dict["nb_rnn_layers"]
-    adam_w = config_dict["adam_w"]
-    distribution_mode = config_dict["distribution_mode"]
-    classification = config_dict["classification"]
-    reg_balancing = config_dict["reg_balancing"]
-    split_idx = config_dict["split_idx"]
-    validation_network_stride = config_dict["validation_network_stride"]
-
-    assert reg_balancing in {'none', 'lds', 'sr'}, f"wrong key: {reg_balancing}"
-    assert classification or distribution_mode == 1, "distribution_mode must be 1 (no class balancing) in regression mode"
-    balancer_type = 0
-    lds = None
-    sr = None
-    if reg_balancing == 'lds':
-        balancer_type = 1
-    elif reg_balancing == 'sr':
-        balancer_type = 2
-
-    window_size = int(window_size_s * fe)
-    seq_stride = int(seq_stride_s * fe)
-
-    if device_val.startswith("cuda") or device_train.startswith("cuda"):
-        assert torch.cuda.is_available(), "CUDA unavailable"
-
-    logger = LoggerWandb(experiment_name, config_dict, wandb_project)
-    torch.seed()
-    net = PortiloopNetwork(config_dict).to(device=device_train)
-    criterion = nn.MSELoss(reduction='none') if not classification else nn.BCELoss(reduction='none')
-    # criterion = nn.MSELoss() if not classification else nn.BCELoss()
-    optimizer = optim.AdamW(net.parameters(), lr=lr_adam, weight_decay=adam_w)
-    best_loss_early_stopping = 1
-    best_epoch_early_stopping = 0
-    best_model_precision_validation = 0
-    best_model_f1_score_validation = 0
-    best_model_recall_validation = 0
-    best_model_loss_validation = 1
-
-    best_model_on_loss_accuracy = 0
-    best_model_on_loss_precision_validation = 0
-    best_model_on_loss_f1_score_validation = 0
-    best_model_on_loss_recall_validation = 0
-    best_model_on_loss_loss_validation = 1
-
-    first_epoch = 0
-    try:
-        logger.restore(classification)
-        file_exp = experiment_name
-        file_exp += "" if classification else "_on_loss"
-        checkpoint = torch.load(path_dataset / file_exp)
-        logging.debug("Use checkpoint model")
-        net.load_state_dict(checkpoint['model_state_dict'])
-        optimizer.load_state_dict(checkpoint['optimizer_state_dict'])
-        first_epoch = checkpoint['epoch'] + 1
-        recall_validation_factor = checkpoint['recall_validation_factor']
-        precision_validation_factor = checkpoint['precision_validation_factor']
-        best_model_on_loss_loss_validation = checkpoint['best_model_on_loss_loss_validation']
-        best_model_f1_score_validation = checkpoint['best_model_f1_score_validation']
-    except (ValueError, FileNotFoundError):
-        #    net = PortiloopNetwork(config_dict).to(device=device_train)
-        logging.debug("Create new model")
-    net = net.train()
-    nb_weights = 0
-    for i in net.parameters():
-        nb_weights += len(i)
-    has_envelope = 1
-    if config_dict["envelope_input"]:
-        has_envelope = 2
-    config_dict["estimator_size_memory"] = nb_weights * window_size * seq_len * batch_size * has_envelope
-
-    train_loader, validation_loader, batch_size_validation, _, _, _ = generate_dataloader(window_size, fe, seq_len, seq_stride, distribution_mode,
-                                                                                          batch_size, nb_batch_per_epoch, classification, split_idx,
-                                                                                          validation_network_stride)
-    if balancer_type == 1:
-        lds = LabelDistributionSmoothing(c=1.0, dataset=train_loader.dataset, weights=None, kernel_size=5, kernel_std=0.01, nb_bins=100,
-                                         weighting_mode='inv_sqrt')
-    elif balancer_type == 2:
-        sr = SurpriseReweighting(weights=None, nb_bins=100, alpha=1e-3)
-
-    best_model_accuracy = 0
-    best_epoch = 0
-    best_model = None
-
-    accuracy_train = None
-    loss_train = None
-
-    early_stopping_counter = 0
-    loss_early_stopping = None
-    h1_zero = torch.zeros((nb_rnn_layers, batch_size, hidden_size), device=device_train)
-    h2_zero = torch.zeros((nb_rnn_layers, batch_size, hidden_size), device=device_train)
-    for epoch in range(first_epoch, first_epoch + nb_epoch_max):
-
-        logging.debug(f"epoch: {epoch}")
-
-        n = 0
-        if epoch > -1:
-            accuracy_train = 0
-            loss_train = 0
-            _t_start = time.time()
-            for batch_data in train_loader:
-                batch_samples_input1, batch_samples_input2, batch_samples_input3, batch_labels = batch_data
-                batch_samples_input1 = batch_samples_input1.to(device=device_train).float()
-                batch_samples_input2 = batch_samples_input2.to(device=device_train).float()
-                batch_samples_input3 = batch_samples_input3.to(device=device_train).float()
-                batch_labels = batch_labels.to(device=device_train).float()
-
-                optimizer.zero_grad()
-                if classification:
-                    batch_labels = (batch_labels > THRESHOLD)
-                    batch_labels = batch_labels.float()
-
-                output, _, _, _ = net(batch_samples_input1, batch_samples_input2, batch_samples_input3, h1_zero, h2_zero)
-
-                output = output.view(-1)
-
-                loss = criterion(output, batch_labels)
-
-                if balancer_type == 1:
-                    batch_weights = lds.lds_weights_batch(batch_labels)
-                    loss = loss * batch_weights
-                    error = batch_weights.isinf().any().item() or batch_weights.isnan().any().item() or torch.isnan(
-                        loss).any().item() or torch.isinf(loss).any().item()
-                    if error:
-                        logging.debug(f"batch_labels: {batch_labels}")
-                        logging.debug(f"batch_weights: {batch_weights}")
-                        logging.debug(f"loss: {loss}")
-                        logging.debug(f"LDS: {lds}")
-                        assert False, "loss is nan or inf"
-                elif balancer_type == 2:
-                    loss = sr.update_and_get_weighted_loss(batch_labels=batch_labels, unweighted_loss=loss)
-                    error = torch.isnan(loss).any().item() or torch.isinf(loss).any().item()
-                    if error:
-                        logging.debug(f"batch_labels: {batch_labels}")
-                        logging.debug(f"loss: {loss}")
-                        logging.debug(f"SR: {sr}")
-                        assert False, "loss is nan or inf"
-
-                loss = loss.mean()
-
-                loss_train += loss.item()
-                loss.backward()
-                optimizer.step()
-
-                if not classification:
-                    output = (output > THRESHOLD)
-                    batch_labels = (batch_labels > THRESHOLD)
-                else:
-                    output = (output >= 0.5)
-                accuracy_train += (output == batch_labels).float().mean()
-                n += 1
-            _t_stop = time.time()
-            logging.debug(f"Training time for 1 epoch : {_t_stop - _t_start} s")
-            accuracy_train /= n
-            loss_train /= n
-
-            _t_start = time.time()
-        output_validation, labels_validation, loss_validation, accuracy_validation, tp, tn, fp, fn = run_inference(validation_loader, criterion, net,
-                                                                                                                   device_val, hidden_size,
-                                                                                                                   nb_rnn_layers, classification,
-                                                                                                                   batch_size_validation)
-        f1_validation, precision_validation, recall_validation = get_metrics(tp, fp, fn)
-
-        _t_stop = time.time()
-        logging.debug(f"Validation time for 1 epoch : {_t_stop - _t_start} s")
-
-        recall_validation_factor = recall_validation
-        precision_validation_factor = precision_validation
-        updated_model = False
-        if f1_validation > best_model_f1_score_validation:
-            best_model = copy.deepcopy(net)
-            best_epoch = epoch
-            # torch.save(best_model.state_dict(), path_dataset / experiment_name, _use_new_zipfile_serialization=False)
-            if save_model:
-                torch.save({
-                    'epoch': epoch,
-                    'model_state_dict': best_model.state_dict(),
-                    'optimizer_state_dict': optimizer.state_dict(),
-                    'recall_validation_factor': recall_validation_factor,
-                    'precision_validation_factor': precision_validation_factor,
-                    'best_model_on_loss_loss_validation': best_model_on_loss_loss_validation,
-                    'best_model_f1_score_validation': best_model_f1_score_validation,
-                }, path_dataset / experiment_name, _use_new_zipfile_serialization=False)
-                updated_model = True
-            best_model_f1_score_validation = f1_validation
-            best_model_precision_validation = precision_validation
-            best_model_recall_validation = recall_validation
-            best_model_loss_validation = loss_validation
-            best_model_accuracy = accuracy_validation
-        if loss_validation < best_model_on_loss_loss_validation:
-            best_model = copy.deepcopy(net)
-            best_epoch = epoch
-            # torch.save(best_model.state_dict(), path_dataset / experiment_name, _use_new_zipfile_serialization=False)
-            if save_model:
-                torch.save({
-                    'epoch': epoch,
-                    'model_state_dict': best_model.state_dict(),
-                    'optimizer_state_dict': optimizer.state_dict(),
-                    'recall_validation_factor': recall_validation_factor,
-                    'precision_validation_factor': precision_validation_factor,
-                    'best_model_on_loss_loss_validation': best_model_on_loss_loss_validation,
-                    'best_model_f1_score_validation': best_model_f1_score_validation,
-                }, path_dataset / (experiment_name + "_on_loss"), _use_new_zipfile_serialization=False)
-                updated_model = True
-            best_model_on_loss_f1_score_validation = f1_validation
-            best_model_on_loss_precision_validation = precision_validation
-            best_model_on_loss_recall_validation = recall_validation
-            best_model_on_loss_loss_validation = loss_validation
-            best_model_on_loss_accuracy = accuracy_validation
-
-        loss_early_stopping = loss_validation if loss_early_stopping is None and early_stopping_smoothing_factor == 1 else loss_validation if loss_early_stopping is None else loss_validation * early_stopping_smoothing_factor + loss_early_stopping * (
-                1.0 - early_stopping_smoothing_factor)
-
-        if loss_early_stopping < best_loss_early_stopping:
-            best_loss_early_stopping = loss_early_stopping
-            early_stopping_counter = 0
-            best_epoch_early_stopping = epoch
-        else:
-            early_stopping_counter += 1
-
-        logger.log(accuracy_train=accuracy_train,
-                   loss_train=loss_train,
-                   accuracy_validation=accuracy_validation,
-                   loss_validation=loss_validation,
-                   f1_validation=f1_validation,
-                   precision_validation=precision_validation,
-                   recall_validation=recall_validation,
-                   best_epoch=best_epoch,
-                   best_model=best_model,
-                   loss_early_stopping=loss_early_stopping,
-                   best_epoch_early_stopping=best_epoch_early_stopping,
-                   best_model_accuracy_validation=best_model_accuracy,
-                   best_model_f1_score_validation=best_model_f1_score_validation,
-                   best_model_precision_validation=best_model_precision_validation,
-                   best_model_recall_validation=best_model_recall_validation,
-                   best_model_loss_validation=best_model_loss_validation,
-                   best_model_on_loss_accuracy_validation=best_model_on_loss_accuracy,
-                   best_model_on_loss_f1_score_validation=best_model_on_loss_f1_score_validation,
-                   best_model_on_loss_precision_validation=best_model_on_loss_precision_validation,
-                   best_model_on_loss_recall_validation=best_model_on_loss_recall_validation,
-                   best_model_on_loss_loss_validation=best_model_on_loss_loss_validation,
-                   updated_model=updated_model)
-
-        if early_stopping_counter > nb_epoch_early_stopping_stop or time.time() - _t_start > max_duration:
-            logging.debug("Early stopping.")
-            break
-    logging.debug("Delete logger")
-    del logger
-    logging.debug("Logger deleted")
-    return best_model_loss_validation, best_model_f1_score_validation, best_epoch_early_stopping
-
-def run_offline_unlabelled(config_dict, path_experiments, unlabelled_segment):
-    logging.debug(f"config_dict: {config_dict}")
-    experiment_name = config_dict['experiment_name']
-    window_size_s = config_dict["window_size_s"]
-    fe = config_dict["fe"]
-    seq_stride_s = config_dict["seq_stride_s"]
-    hidden_size = config_dict["hidden_size"]
-    device_inference = config_dict["device_inference"]
-    nb_rnn_layers = config_dict["nb_rnn_layers"]
-    classification = config_dict["classification"]
-    validation_network_stride = config_dict["validation_network_stride"]
-
-    window_size = int(window_size_s * fe)
-    seq_stride = int(seq_stride_s * fe)
-
-    if device_inference.startswith("cuda"):
-        assert torch.cuda.is_available(), "CUDA unavailable"
-
-    torch.seed()
-    net = PortiloopNetwork(config_dict).to(device=device_inference)
-
-    file_exp = experiment_name
-    file_exp += "" if classification else "_on_loss"
-    path_experiments = Path(path_experiments)
-    if not device_inference.startswith("cuda"):
-        checkpoint = torch.load(path_experiments / file_exp, map_location=torch.device('cpu'))
-    else:
-        checkpoint = torch.load(path_experiments / file_exp)
-    logging.debug("Use checkpoint model")
-    net.load_state_dict(checkpoint['model_state_dict'])
-
-    test_loader, batch_size_test = generate_dataloader_unlabelled_offline(unlabelled_segment=unlabelled_segment,
-                                                                          window_size=window_size,
-                                                                          seq_stride=seq_stride,
-                                                                          network_stride=validation_network_stride)
-
-    output_total, true_idx_total = run_inference_unlabelled_offline(dataloader=test_loader,
-                                                                    net=net,
-                                                                    device=device_inference,
-                                                                    hidden_size=hidden_size,
-                                                                    nb_rnn_layers=nb_rnn_layers,
-                                                                    classification=classification,
-                                                                    batch_size_validation=batch_size_test)
-    return output_total, true_idx_total
-
-
-
-def get_config_dict(index, split_i):
-    # config_dict = {'experiment_name': f'pareto_search_10_619_{index}', 'device_train': 'cuda:0', 'device_val': 'cuda:0', 'nb_epoch_max': 1000,
-    # 'max_duration': 257400, 'nb_epoch_early_stopping_stop': 20, 'early_stopping_smoothing_factor': 0.1, 'fe': 250, 'nb_batch_per_epoch': 5000,
-    # 'first_layer_dropout': False, 'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
-    # 'nb_conv_layers': 3, 'seq_len': 50, 'nb_channel': 16, 'hidden_size': 32, 'seq_stride_s': 0.08600000000000001, 'nb_rnn_layers': 1,
-    # 'RNN': True, 'envelope_input': True, 'window_size_s': 0.266, 'stride_pool': 1, 'stride_conv': 1, 'kernel_conv': 9, 'kernel_pool': 7,
-    # 'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 24, 'time_in_past': 4.300000000000001, 'estimator_size_memory': 1628774400, "batch_size":
-    # batch_size_list[index % len(batch_size_list)], "lr_adam": lr_adam_list[index % len(lr_adam_list)]}
-    c_dict = {'experiment_name': f'spindleNet_{index}', 'device_train': 'cuda:0', 'device_val':
-        'cuda:0', 'nb_epoch_max': 500,
-              'max_duration': 257400, 'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
-              'nb_batch_per_epoch': 1000,
-              'first_layer_dropout': False,
-              'power_features_input': True, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
-              'reg_balancing': 'none',
-              'nb_conv_layers': 5,
-              'seq_len': 50, 'nb_channel': 40, 'hidden_size': 100, 'seq_stride_s': 0.004, 'nb_rnn_layers': 1, 'RNN': True,
-              'envelope_input': True,
-              "batch_size": 20, "lr_adam": 0.0009,
-              'window_size_s': 0.250, 'stride_pool': 1, 'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 5,
-              'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 2, 'time_in_past': 1.55, 'estimator_size_memory': 139942400}
-    # put LSTM and Softmax for the occasion and add padding, not exactly the same frequency (spindleNet = 200 Hz)
-
-    c_dict = {'experiment_name': f'ABLATION_{ABLATION}_test_v11_implemented_on_portiloop_{index}', 'device_train': 'cuda:0', 'device_val':
-        'cuda:0', 'nb_epoch_max': 500,
-              'max_duration': 257400, 'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
-              'nb_batch_per_epoch': 1000,
-              'first_layer_dropout': False,
-              'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
-              'reg_balancing': 'none',
-              'nb_conv_layers': 4,
-              'seq_len': 50, 'nb_channel': 26, 'hidden_size': 7, 'seq_stride_s': 0.044, 'nb_rnn_layers': 2, 'RNN': True,
-              'envelope_input': True,
-              "batch_size": 256, "lr_adam": 0.0009,
-              'window_size_s': 0.234, 'stride_pool': 1, 'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 9,
-              'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 2, 'time_in_past': 1.55, 'estimator_size_memory': 139942400,
-              'split_idx': split_i, 'validation_network_stride': 1}
-    c_dict = {'experiment_name': f'pareto_search_15_35_v5_small_seq_{index}', 'device_train': 'cuda:0', 'device_val': 'cuda:0', 'nb_epoch_max': 150,
-              'max_duration':
-                  257400,
-              'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250, 'nb_batch_per_epoch': 1000,
-              'first_layer_dropout': False,
-              'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
-              'reg_balancing': 'none',
-              'split_idx': split_i, 'validation_network_stride': 1, 'nb_conv_layers': 3, 'seq_len': 50, 'nb_channel': 31, 'hidden_size': 7,
-              'seq_stride_s': 0.02,
-              'nb_rnn_layers': 1, 'RNN': True, 'envelope_input': False, 'lr_adam': 0.0005, 'batch_size': 256, 'window_size_s': 0.218,
-              'stride_pool': 1,
-              'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 7, 'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 18, 'time_in_past': 8.5,
-              'estimator_size_memory': 188006400}
-    c_dict = {'experiment_name': f'ABLATION_{ABLATION}_2inputs_network_{index}', 'device_train': 'cuda:0', 'device_val':
-        'cuda:0', 'nb_epoch_max': 500,
-              'max_duration': 257400, 'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
-              'nb_batch_per_epoch': 1000,
-              'first_layer_dropout': False,
-              'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
-              'reg_balancing': 'none',
-              'nb_conv_layers': 4,
-              'seq_len': 50, 'nb_channel': 26, 'hidden_size': 7, 'seq_stride_s': 0.044, 'nb_rnn_layers': 2, 'RNN': True,
-              'envelope_input': True,
-              "batch_size": 256, "lr_adam": 0.0009,
-              'window_size_s': 0.234, 'stride_pool': 1, 'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 9,
-              'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 2, 'time_in_past': 1.55, 'estimator_size_memory': 139942400,
-              'split_idx': split_i, 'validation_network_stride': 1}
-    c_dict = {'experiment_name': f'pareto_search_15_35_v6_{index}', 'device_train': 'cuda:0', 'device_val': 'cuda:0', 'nb_epoch_max': 500,
-              'max_duration':
-                  257400,
-              'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250, 'nb_batch_per_epoch': 1000,
-              'first_layer_dropout': False,
-              'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0, 'classification': True,
-              'reg_balancing': 'none',
-              'split_idx': split_i, 'validation_network_stride': 1, 'nb_conv_layers': 3, 'seq_len': 50, 'nb_channel': 31, 'hidden_size': 7,
-              'seq_stride_s': 0.17,
-              'nb_rnn_layers': 1, 'RNN': True, 'envelope_input': False, 'lr_adam': 0.0005, 'batch_size': 256, 'window_size_s': 0.218,
-              'stride_pool': 1,
-              'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 7, 'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 18, 'time_in_past': 8.5,
-              'estimator_size_memory': 188006400}
-    return c_dict
-
-def get_final_model_config_dict(index=0, split_i=0):
-    """
-    Configuration dictionary of the final 1-input pre-trained model presented in the Portiloop paper.
-
-    Args:
-        index: last number in the name of the pre-trained model (several are provided)
-        split_i: index of the random train/validation/test split (you can ignore this for inference)
-
-    Returns:
-        configuration dictionary of the pre-trained model
-    """
-    c_dict = {'experiment_name': f'pareto_search_15_35_v4_{index}', 'device_train': 'cpu', 'device_val': 'cpu',
-              'device_inference': 'cpu', 'nb_epoch_max': 150, 'max_duration': 257400,
-              'nb_epoch_early_stopping_stop': 100, 'early_stopping_smoothing_factor': 0.1, 'fe': 250,
-              'nb_batch_per_epoch': 1000,
-              'first_layer_dropout': False,
-              'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0,
-              'classification': True,
-              'reg_balancing': 'none',
-              'split_idx': split_i, 'validation_network_stride': 1, 'nb_conv_layers': 3, 'seq_len': 50,
-              'nb_channel': 31, 'hidden_size': 7,
-              'seq_stride_s': 0.170,
-              'nb_rnn_layers': 1, 'RNN': True, 'envelope_input': False, 'lr_adam': 0.0005, 'batch_size': 256,
-              'window_size_s': 0.218,
-              'stride_pool': 1,
-              'stride_conv': 1, 'kernel_conv': 7, 'kernel_pool': 7, 'dilation_conv': 1, 'dilation_pool': 1,
-              'nb_out': 18, 'time_in_past': 8.5,
-              'estimator_size_memory': 188006400}
-    return c_dict
-
-if __name__ == "__main__":
-    parser = ArgumentParser()
-    parser.add_argument('--experiment_name', type=str)
-    parser.add_argument('--experiment_index', type=int)
-    parser.add_argument('--output_file', type=str, default=None)
-    parser.add_argument('--phase', type=str, default='full')
-    parser.add_argument('--ablation', type=int, default=0)
-    parser.add_argument('--max_split', type=int, default=10)
-    feature_parser = parser.add_mutually_exclusive_group(required=False)
-    feature_parser.add_argument('--test_set', dest='test_set', action='store_true')
-    feature_parser.add_argument('--no_test_set', dest='test_set', action='store_false')
-    parser.set_defaults(test_set=True)
-    feature_class_parser = parser.add_mutually_exclusive_group(required=False)
-    feature_class_parser.add_argument('--classification', dest='classification', action='store_true')
-    feature_class_parser.add_argument('--regression', dest='classification', action='store_false')
-    parser.set_defaults(classification=True)
-    args = parser.parse_args()
-    if args.output_file is not None:
-        logging.basicConfig(format='%(levelname)s: %(message)s', filename=args.output_file, level=logging.DEBUG)
-    else:
-        logging.basicConfig(format='%(levelname)s: %(message)s', level=logging.DEBUG)
-    ABLATION = args.ablation  # 0 : no ablation, 1 : remove input 1, 2 : remove input 2
-    PHASE = args.phase
-    WANDB_PROJECT_RUN = f"{PHASE}-dataset-public"
-    threshold_list = {'p1': 0.2, 'p2': 0.35, 'full': 0.2}  # full = p1 + p2
-    THRESHOLD = threshold_list[PHASE]
-    # WANDB_PROJECT_RUN = f"tests_yann"
-
-    filename_regression_dataset = f"dataset_regression_{PHASE}_big_250_matlab_standardized_envelope_pf.txt"
-    filename_classification_dataset = f"dataset_classification_{PHASE}_big_250_matlab_standardized_envelope_pf.txt"
-    subject_list = f"subject_sequence_{PHASE}_big.txt"
-    subject_list_p1 = f"subject_sequence_p1_big.txt"
-    subject_list_p2 = f"subject_sequence_p2_big.txt"
-
-    max_split = args.max_split
-    exp_name = args.experiment_name
-    exp_index = args.experiment_index
-    possible_split = [0, 2]
-    split_idx = possible_split[exp_index % 2]
-    classification = args.classification
-    TEST_SET = args.test_set
-    logging.debug(f"classification: {classification}")
-    config_dict = get_config_dict(exp_index, split_idx)
-    config_dict['distribution_mode'] = 0 if classification else 1
-    config_dict['classification'] = classification
-    config_dict['experiment_name'] += "_regression" if not classification else ""
-    config_dict['experiment_name'] += "_no_test" if not TEST_SET else ""
-    seed()  # reset the seed
-    # config_dict = {'experiment_name': 'pareto_search_10_619', 'device_train': 'cuda:0', 'device_val': 'cuda:0', 'nb_epoch_max': 11,
-    # 'max_duration': 257400, 'nb_epoch_early_stopping_stop': 10, 'early_stopping_smoothing_factor': 0.1, 'fe': 250, 'nb_batch_per_epoch': 5000,
-    # 'batch_size': 256, 'first_layer_dropout': False, 'power_features_input': False, 'dropout': 0.5, 'adam_w': 0.01, 'distribution_mode': 0,
-    # 'classification': True, 'nb_conv_layers': 3, 'seq_len': 50, 'nb_channel': 16, 'hidden_size': 32, 'seq_stride_s': 0.08600000000000001,
-    # 'nb_rnn_layers': 1, 'RNN': True, 'envelope_input': True, 'lr_adam': 0.0007, 'window_size_s': 0.266, 'stride_pool': 1, 'stride_conv': 1,
-    # 'kernel_conv': 9, 'kernel_pool': 7, 'dilation_conv': 1, 'dilation_pool': 1, 'nb_out': 24, 'time_in_past': 4.300000000000001,
-    # 'estimator_size_memory': 1628774400}
-
-    run(config_dict=config_dict, wandb_project=WANDB_PROJECT_RUN, save_model=True, unique_name=False)
-else:
-    ABLATION = 0
-    PHASE = 'full'
-    TEST_SET = True
-
-    threshold_list = {'p1': 0.2, 'p2': 0.35, 'full': 0.5}  # full = p1 + p2
-    THRESHOLD = threshold_list[PHASE]
-    # WANDB_PROJECT_RUN = f"tests_yann"
-
-    filename_regression_dataset = f"dataset_regression_{PHASE}_big_250_matlab_standardized_envelope_pf.txt"
-    filename_classification_dataset = f"dataset_classification_{PHASE}_big_250_matlab_standardized_envelope_pf.txt"
-    subject_list = f"subject_sequence_{PHASE}_big.txt"
-    subject_list_p1 = f"subject_sequence_p1_big.txt"
-    subject_list_p2 = f"subject_sequence_p2_big.txt"
diff --git a/portiloop_software/portiloop_python/ANN/training_experiment.py b/portiloop_software/portiloop_python/ANN/training_experiment.py
new file mode 100644
index 0000000..55da314
--- /dev/null
+++ b/portiloop_software/portiloop_python/ANN/training_experiment.py
@@ -0,0 +1,852 @@
+"""
+Main script for training an ANN.
+"""
+
+# all imports
+
+import copy
+from distutils.command.config import config
+import json
+import logging
+import os
+import time
+from argparse import ArgumentParser
+from pathlib import Path
+from random import seed
+
+import numpy as np
+import torch
+import torch.nn as nn
+import torch.optim as optim
+from torch.nn import functional as F
+
+from scipy.ndimage import gaussian_filter1d
+
+from portiloop_software.portiloop_python.Utils.utils import out_dim
+from portiloop_software.portiloop_python.ANN.dataset import LabelDistributionSmoothing, generate_dataloader, generate_dataloader_unlabelled_offline
+from portiloop_software.portiloop_python.ANN.nn_utils import LoggerWandb, SurpriseReweighting, get_metrics
+from portiloop_software.portiloop_python.ANN.configs import get_nn_dict
+
+
+# all classes and functions:
+class ConvPoolModule(nn.Module):
+    def __init__(self,
+                 in_channels,
+                 out_channel,
+                 kernel_conv,
+                 stride_conv,
+                 conv_padding,
+                 dilation_conv,
+                 kernel_pool,
+                 stride_pool,
+                 pool_padding,
+                 dilation_pool,
+                 dropout_p):
+        super(ConvPoolModule, self).__init__()
+
+        self.conv = nn.Conv1d(in_channels=in_channels,
+                              out_channels=out_channel,
+                              kernel_size=kernel_conv,
+                              stride=stride_conv,
+                              padding=conv_padding,
+                              dilation=dilation_conv)
+        self.pool = nn.MaxPool1d(kernel_size=kernel_pool,
+                                 stride=stride_pool,
+                                 padding=pool_padding,
+                                 dilation=dilation_pool)
+        self.dropout = nn.Dropout(dropout_p)
+
+    def forward(self, input_f):
+        x, max_value = input_f
+        x = F.relu(self.conv(x))
+        x = self.pool(x)
+        max_temp = torch.max(abs(x))
+        if max_temp > max_value:
+            logging.debug(f"max_value = {max_temp}")
+            max_value = max_temp
+        return self.dropout(x), max_value
+
+
+class FcModule(nn.Module):
+    def __init__(self,
+                 in_features,
+                 out_features,
+                 dropout_p):
+        super(FcModule, self).__init__()
+
+        self.fc = nn.Linear(in_features=in_features, out_features=out_features)
+        self.dropout = nn.Dropout(dropout_p)
+
+    def forward(self, x):
+        x = F.relu(self.fc(x))
+        return self.dropout(x)
+
+
+class PortiloopNetwork(nn.Module):
+    def __init__(self, c_dict, exp_config):
+        super(PortiloopNetwork, self).__init__()
+
+        self.exp_config = exp_config
+
+        RNN = c_dict["RNN"]
+        stride_pool = c_dict["stride_pool"]
+        stride_conv = c_dict["stride_conv"]
+        kernel_conv = c_dict["kernel_conv"]
+        kernel_pool = c_dict["kernel_pool"]
+        nb_channel = c_dict["nb_channel"]
+        hidden_size = c_dict["hidden_size"]
+        window_size_s = c_dict["window_size_s"]
+        dropout_p = c_dict["dropout"]
+        dilation_conv = c_dict["dilation_conv"]
+        dilation_pool = c_dict["dilation_pool"]
+        fe = c_dict["fe"]
+        nb_conv_layers = c_dict["nb_conv_layers"]
+        nb_rnn_layers = c_dict["nb_rnn_layers"]
+        first_layer_dropout = c_dict["first_layer_dropout"]
+        self.envelope_input = c_dict["envelope_input"]
+        self.power_features_input = c_dict["power_features_input"]
+        self.classification = c_dict["classification"]
+
+        conv_padding = 0  # int(kernel_conv // 2)
+        pool_padding = 0  # int(kernel_pool // 2)
+        window_size = int(window_size_s * fe)
+        nb_out = window_size
+
+        for _ in range(nb_conv_layers):
+            nb_out = out_dim(nb_out, conv_padding,
+                             dilation_conv, kernel_conv, stride_conv)
+            nb_out = out_dim(nb_out, pool_padding,
+                             dilation_pool, kernel_pool, stride_pool)
+
+        output_cnn_size = int(nb_channel * nb_out)
+
+        self.RNN = RNN
+        self.first_layer_input1 = ConvPoolModule(in_channels=1,
+                                                 out_channel=nb_channel,
+                                                 kernel_conv=kernel_conv,
+                                                 stride_conv=stride_conv,
+                                                 conv_padding=conv_padding,
+                                                 dilation_conv=dilation_conv,
+                                                 kernel_pool=kernel_pool,
+                                                 stride_pool=stride_pool,
+                                                 pool_padding=pool_padding,
+                                                 dilation_pool=dilation_pool,
+                                                 dropout_p=dropout_p if first_layer_dropout else 0)
+        self.seq_input1 = nn.Sequential(*(ConvPoolModule(in_channels=nb_channel,
+                                                         out_channel=nb_channel,
+                                                         kernel_conv=kernel_conv,
+                                                         stride_conv=stride_conv,
+                                                         conv_padding=conv_padding,
+                                                         dilation_conv=dilation_conv,
+                                                         kernel_pool=kernel_pool,
+                                                         stride_pool=stride_pool,
+                                                         pool_padding=pool_padding,
+                                                         dilation_pool=dilation_pool,
+                                                         dropout_p=dropout_p) for _ in range(nb_conv_layers - 1)))
+        if RNN:
+            self.gru_input1 = nn.GRU(input_size=output_cnn_size,
+                                     hidden_size=hidden_size,
+                                     num_layers=nb_rnn_layers,
+                                     dropout=0,
+                                     batch_first=True)
+        #       fc_size = hidden_size
+        else:
+            self.first_fc_input1 = FcModule(
+                in_features=output_cnn_size, out_features=hidden_size, dropout_p=dropout_p)
+            self.seq_fc_input1 = nn.Sequential(
+                *(FcModule(in_features=hidden_size, out_features=hidden_size, dropout_p=dropout_p) for _ in range(nb_rnn_layers - 1)))
+        if self.envelope_input:
+            self.first_layer_input2 = ConvPoolModule(in_channels=1,
+                                                     out_channel=nb_channel,
+                                                     kernel_conv=kernel_conv,
+                                                     stride_conv=stride_conv,
+                                                     conv_padding=conv_padding,
+                                                     dilation_conv=dilation_conv,
+                                                     kernel_pool=kernel_pool,
+                                                     stride_pool=stride_pool,
+                                                     pool_padding=pool_padding,
+                                                     dilation_pool=dilation_pool,
+                                                     dropout_p=dropout_p if first_layer_dropout else 0)
+            self.seq_input2 = nn.Sequential(*(ConvPoolModule(in_channels=nb_channel,
+                                                             out_channel=nb_channel,
+                                                             kernel_conv=kernel_conv,
+                                                             stride_conv=stride_conv,
+                                                             conv_padding=conv_padding,
+                                                             dilation_conv=dilation_conv,
+                                                             kernel_pool=kernel_pool,
+                                                             stride_pool=stride_pool,
+                                                             pool_padding=pool_padding,
+                                                             dilation_pool=dilation_pool,
+                                                             dropout_p=dropout_p) for _ in range(nb_conv_layers - 1)))
+
+            if RNN:
+                self.gru_input2 = nn.GRU(input_size=output_cnn_size,
+                                         hidden_size=hidden_size,
+                                         num_layers=nb_rnn_layers,
+                                         dropout=0,
+                                         batch_first=True)
+            else:
+                self.first_fc_input2 = FcModule(
+                    in_features=output_cnn_size, out_features=hidden_size, dropout_p=dropout_p)
+                self.seq_fc_input2 = nn.Sequential(
+                    *(FcModule(in_features=hidden_size, out_features=hidden_size, dropout_p=dropout_p) for _ in range(nb_rnn_layers - 1)))
+        fc_features = 0
+        fc_features += hidden_size
+        if self.envelope_input:
+            fc_features += hidden_size
+        if self.power_features_input:
+            fc_features += 1
+        out_features = 1
+        self.fc = nn.Linear(in_features=fc_features,  # enveloppe and signal + power features ratio
+                            out_features=out_features)  # probability of being a spindle
+
+    def forward(self, x1, x2, x3, h1, h2, max_value=np.inf):
+        # x1 : input 1 : cleaned signal
+        # x2 : input 2 : envelope
+        # x3 : power features ratio
+        # h1 : gru 1 hidden size
+        # h2 : gru 2 hidden size
+        # max_value (optional) : print the maximal value reach during inference (used to verify if the FPGA implementation precision is enough)
+        (batch_size, sequence_len, features) = x1.shape
+
+        if self.exp_config['ablation'] == 1:
+            x1 = copy.deepcopy(x2)
+        elif self.exp_config['ablation'] == 2:
+            x2 = copy.deepcopy(x1)
+
+        x1 = x1.view(-1, 1, features)
+        x1, max_value = self.first_layer_input1((x1, max_value))
+        x1, max_value = self.seq_input1((x1, max_value))
+
+        x1 = torch.flatten(x1, start_dim=1, end_dim=-1)
+        hn1 = None
+        if self.RNN:
+            x1 = x1.view(batch_size, sequence_len, -1)
+            x1, hn1 = self.gru_input1(x1, h1)
+            max_temp = torch.max(abs(x1))
+            if max_temp > max_value:
+                logging.debug(f"max_value = {max_temp}")
+                max_value = max_temp
+            x1 = x1[:, -1, :]
+        else:
+            x1 = self.first_fc_input1(x1)
+            x1 = self.seq_fc_input1(x1)
+        x = x1
+        hn2 = None
+        if self.envelope_input:
+            x2 = x2.view(-1, 1, features)
+            x2, max_value = self.first_layer_input2((x2, max_value))
+            x2, max_value = self.seq_input2((x2, max_value))
+
+            x2 = torch.flatten(x2, start_dim=1, end_dim=-1)
+            if self.RNN:
+                x2 = x2.view(batch_size, sequence_len, -1)
+                x2, hn2 = self.gru_input2(x2, h2)
+                max_temp = torch.max(abs(x2))
+                if max_temp > max_value:
+                    logging.debug(f"max_value = {max_temp}")
+                    max_value = max_temp
+                x2 = x2[:, -1, :]
+            else:
+                x2 = self.first_fc_input2(x2)
+                x2 = self.seq_fc_input2(x2)
+            x = torch.cat((x, x2), -1)
+
+        if self.power_features_input:
+            x3 = x3.view(-1, 1)
+            x = torch.cat((x, x3), -1)
+
+        x = self.fc(x)  # output size: 1
+        max_temp = torch.max(abs(x))
+        if max_temp > max_value:
+            logging.debug(f"max_value = {max_temp}")
+            max_value = max_temp
+        x = torch.sigmoid(x)
+
+        return x, hn1, hn2, max_value
+
+
+def run_inference(exp_config, dataloader, criterion, net, device, hidden_size, nb_rnn_layers, classification, batch_size_validation, max_value=np.inf):
+    net_copy = copy.deepcopy(net)
+    net_copy = net_copy.to(device)
+    net_copy = net_copy.eval()
+    loss = 0
+    n = 0
+    batch_labels_total = torch.tensor([], device=device)
+    output_total = torch.tensor([], device=device)
+    h1 = torch.zeros((nb_rnn_layers, batch_size_validation,
+                     hidden_size), device=device)
+    h2 = torch.zeros((nb_rnn_layers, batch_size_validation,
+                     hidden_size), device=device)
+    with torch.no_grad():
+        for batch_data in dataloader:
+            batch_samples_input1, batch_samples_input2, batch_samples_input3, batch_labels = batch_data
+            batch_samples_input1 = batch_samples_input1.to(
+                device=device).float()
+            batch_samples_input2 = batch_samples_input2.to(
+                device=device).float()
+            batch_samples_input3 = batch_samples_input3.to(
+                device=device).float()
+            batch_labels = batch_labels.to(device=device).float()
+            if classification:
+                batch_labels = (batch_labels > exp_config['threshold'])
+                batch_labels = batch_labels.float()
+            output, h1, h2, max_value = net_copy(
+                batch_samples_input1, batch_samples_input2, batch_samples_input3, h1, h2, max_value)
+            # logging.debug(f"label = {batch_labels}")
+            # logging.debug(f"output = {output}")
+            output = output.view(-1)
+            loss_py = criterion(output, batch_labels).mean()
+            loss += loss_py.item()
+            # logging.debug(f"loss = {loss}")
+            if not classification:
+                output = (output > exp_config['threshold'])
+                batch_labels = (batch_labels > exp_config['threshold'])
+            else:
+                output = (output >= 0.5)
+            batch_labels_total = torch.cat([batch_labels_total, batch_labels])
+            output_total = torch.cat([output_total, output])
+            # logging.debug(f"batch_label_total : {batch_labels_total}")
+            # logging.debug(f"output_total : {output_total}")
+            n += 1
+
+    loss /= n
+    acc = (output_total == batch_labels_total).float().mean()
+    output_total = output_total.float()
+    batch_labels_total = batch_labels_total.float()
+    tp = (batch_labels_total * output_total)
+    tn = ((1 - batch_labels_total) * (1 - output_total))
+    fp = ((1 - batch_labels_total) * output_total)
+    fn = (batch_labels_total * (1 - output_total))
+    return output_total, batch_labels_total, loss, acc, tp, tn, fp, fn
+
+
+def run_inference_unlabelled_offline(dataloader, net, device, hidden_size, nb_rnn_layers, classification, batch_size_validation):
+    net_copy = copy.deepcopy(net)
+    net_copy = net_copy.to(device)
+    net_copy = net_copy.eval()
+    true_idx_total = torch.tensor([], device=device)
+    output_total = torch.tensor([], device=device)
+    h1 = torch.zeros((nb_rnn_layers, batch_size_validation,
+                     hidden_size), device=device)
+    h2 = torch.zeros((nb_rnn_layers, batch_size_validation,
+                     hidden_size), device=device)
+    max_value = np.inf
+    with torch.no_grad():
+        for batch_data in dataloader:
+            batch_samples_input1, batch_true_idx = batch_data
+            batch_samples_input1 = batch_samples_input1.to(
+                device=device).float()
+            output, h1, h2, max_value = net_copy(
+                batch_samples_input1, None, None, h1, h2, max_value)
+            output = output.view(-1)
+            # if not classification:
+            #     output = output  # (output > THRESHOLD)
+            # else:
+            #     output = (output >= 0.5)
+            true_idx_total = torch.cat([true_idx_total, batch_true_idx])
+            output_total = torch.cat([output_total, output])
+    output_total = output_total.float()
+    true_idx_total = true_idx_total.int()
+    return output_total, true_idx_total
+
+
+def run(nn_config, data_config, exp_config, wandb_project, save_model, unique_name):
+    global precision_validation_factor
+    global recall_validation_factor
+    _t_start = time.time()
+    logging.debug(f"nn_config: {nn_config}")
+    experiment_name = f"{nn_config['experiment_name']}_{time.time_ns()}" if unique_name else nn_config['experiment_name']
+    nb_epoch_max = nn_config["nb_epoch_max"]
+    nb_batch_per_epoch = nn_config["nb_batch_per_epoch"]
+    nb_epoch_early_stopping_stop = nn_config["nb_epoch_early_stopping_stop"]
+    early_stopping_smoothing_factor = nn_config["early_stopping_smoothing_factor"]
+    batch_size = nn_config["batch_size"]
+    seq_len = nn_config["seq_len"]
+    window_size_s = nn_config["window_size_s"]
+    fe = nn_config["fe"]
+    seq_stride_s = nn_config["seq_stride_s"]
+    lr_adam = nn_config["lr_adam"]
+    hidden_size = nn_config["hidden_size"]
+    device_val = nn_config["device_val"]
+    device_train = nn_config["device_train"]
+    max_duration = nn_config["max_duration"]
+    nb_rnn_layers = nn_config["nb_rnn_layers"]
+    adam_w = nn_config["adam_w"]
+    distribution_mode = nn_config["distribution_mode"]
+    classification = nn_config["classification"]
+    reg_balancing = nn_config["reg_balancing"]
+    split_idx = nn_config["split_idx"]
+    validation_network_stride = nn_config["validation_network_stride"]
+
+    assert reg_balancing in {'none', 'lds',
+                             'sr'}, f"wrong key: {reg_balancing}"
+    assert classification or distribution_mode == 1, "distribution_mode must be 1 (no class balancing) in regression mode"
+    balancer_type = 0
+    lds = None
+    sr = None
+    if reg_balancing == 'lds':
+        balancer_type = 1
+    elif reg_balancing == 'sr':
+        balancer_type = 2
+
+    window_size = int(window_size_s * fe)
+    seq_stride = int(seq_stride_s * fe)
+
+    if device_val.startswith("cuda") or device_train.startswith("cuda"):
+        assert torch.cuda.is_available(), "CUDA unavailable"
+
+    logger = LoggerWandb(experiment_name, nn_config,
+                         wandb_project, data_config)
+    torch.seed()
+    net = PortiloopNetwork(nn_config, exp_config).to(device=device_train)
+    criterion = nn.MSELoss(
+        reduction='none') if not classification else nn.BCELoss(reduction='none')
+    # criterion = nn.MSELoss() if not classification else nn.BCELoss()
+    optimizer = optim.AdamW(net.parameters(), lr=lr_adam, weight_decay=adam_w)
+    best_loss_early_stopping = 1
+    best_epoch_early_stopping = 0
+    best_model_precision_validation = 0
+    best_model_f1_score_validation = 0
+    best_model_recall_validation = 0
+    best_model_loss_validation = 1
+
+    best_model_on_loss_accuracy = 0
+    best_model_on_loss_precision_validation = 0
+    best_model_on_loss_f1_score_validation = 0
+    best_model_on_loss_recall_validation = 0
+    best_model_on_loss_loss_validation = 1
+
+    first_epoch = 0
+    try:
+        logger.restore(classification)
+        file_exp = experiment_name
+        file_exp += "" if classification else "_on_loss"
+        if not device_val.startswith("cuda"):
+            checkpoint = torch.load(
+                data_config['path_dataset'] / file_exp, map_location=torch.device('cpu'))
+        else:
+            checkpoint = torch.load(data_config['path_dataset'] / file_exp)
+        logging.debug("Use checkpoint model")
+        net.load_state_dict(checkpoint['model_state_dict'])
+        optimizer.load_state_dict(checkpoint['optimizer_state_dict'])
+        first_epoch = checkpoint['epoch'] + 1
+        recall_validation_factor = checkpoint['recall_validation_factor']
+        precision_validation_factor = checkpoint['precision_validation_factor']
+        best_model_on_loss_loss_validation = checkpoint['best_model_on_loss_loss_validation']
+        best_model_f1_score_validation = checkpoint['best_model_f1_score_validation']
+    except (ValueError, FileNotFoundError):
+        #    net = PortiloopNetwork(config_dict).to(device=device_train)
+        logging.debug("Create new model")
+    net = net.train()
+    nb_weights = 0
+    for i in net.parameters():
+        nb_weights += len(i)
+    has_envelope = 1
+    if nn_config["envelope_input"]:
+        has_envelope = 2
+    nn_config["estimator_size_memory"] = nb_weights * \
+        window_size * seq_len * batch_size * has_envelope
+
+    train_loader, validation_loader, batch_size_validation, _, _, _ = generate_dataloader(data_config, exp_config, window_size, fe, seq_len, seq_stride, distribution_mode,
+                                                                                          batch_size, nb_batch_per_epoch, classification, split_idx,
+                                                                                          validation_network_stride)
+    if balancer_type == 1:
+        lds = LabelDistributionSmoothing(c=1.0, dataset=train_loader.dataset, weights=None, kernel_size=5, kernel_std=0.01, nb_bins=100,
+                                         weighting_mode='inv_sqrt')
+    elif balancer_type == 2:
+        sr = SurpriseReweighting(weights=None, nb_bins=100, alpha=1e-3)
+
+    best_model_accuracy = 0
+    best_epoch = 0
+    best_model = None
+
+    accuracy_train = None
+    loss_train = None
+
+    early_stopping_counter = 0
+    loss_early_stopping = None
+    h1_zero = torch.zeros(
+        (nb_rnn_layers, batch_size, hidden_size), device=device_train)
+    h2_zero = torch.zeros(
+        (nb_rnn_layers, batch_size, hidden_size), device=device_train)
+    for epoch in range(first_epoch, first_epoch + nb_epoch_max):
+
+        logging.debug(f"epoch: {epoch}")
+
+        n = 0
+        if epoch > -1:
+            accuracy_train = 0
+            loss_train = 0
+            _t_start = time.time()
+            for batch_data in train_loader:
+                batch_samples_input1, batch_samples_input2, batch_samples_input3, batch_labels = batch_data
+                batch_samples_input1 = batch_samples_input1.to(
+                    device=device_train).float()
+                batch_samples_input2 = batch_samples_input2.to(
+                    device=device_train).float()
+                batch_samples_input3 = batch_samples_input3.to(
+                    device=device_train).float()
+                batch_labels = batch_labels.to(device=device_train).float()
+
+                optimizer.zero_grad()
+                if classification:
+                    batch_labels = (batch_labels > exp_config['threshold'])
+                    batch_labels = batch_labels.float()
+
+                output, _, _, _ = net(
+                    batch_samples_input1, batch_samples_input2, batch_samples_input3, h1_zero, h2_zero)
+
+                output = output.view(-1)
+
+                loss = criterion(output, batch_labels)
+
+                if balancer_type == 1:
+                    batch_weights = lds.lds_weights_batch(batch_labels)
+                    loss = loss * batch_weights
+                    error = batch_weights.isinf().any().item() or batch_weights.isnan().any().item() or torch.isnan(
+                        loss).any().item() or torch.isinf(loss).any().item()
+                    if error:
+                        logging.debug(f"batch_labels: {batch_labels}")
+                        logging.debug(f"batch_weights: {batch_weights}")
+                        logging.debug(f"loss: {loss}")
+                        logging.debug(f"LDS: {lds}")
+                        assert False, "loss is nan or inf"
+                elif balancer_type == 2:
+                    loss = sr.update_and_get_weighted_loss(
+                        batch_labels=batch_labels, unweighted_loss=loss)
+                    error = torch.isnan(loss).any().item(
+                    ) or torch.isinf(loss).any().item()
+                    if error:
+                        logging.debug(f"batch_labels: {batch_labels}")
+                        logging.debug(f"loss: {loss}")
+                        logging.debug(f"SR: {sr}")
+                        assert False, "loss is nan or inf"
+
+                loss = loss.mean()
+
+                loss_train += loss.item()
+                loss.backward()
+                optimizer.step()
+
+                if not classification:
+                    output = (output > exp_config['threshold'])
+                    batch_labels = (batch_labels > exp_config['threshold'])
+                else:
+                    output = (output >= 0.5)
+                accuracy_train += (output == batch_labels).float().mean()
+                n += 1
+            _t_stop = time.time()
+            logging.debug(
+                f"Training time for 1 epoch : {_t_stop - _t_start} s")
+            accuracy_train /= n
+            loss_train /= n
+
+            _t_start = time.time()
+        output_validation, labels_validation, loss_validation, accuracy_validation, tp, tn, fp, fn = run_inference(exp_config, validation_loader, criterion, net,
+                                                                                                                   device_val, hidden_size,
+                                                                                                                   nb_rnn_layers, classification,
+                                                                                                                   batch_size_validation)
+        f1_validation, precision_validation, recall_validation = get_metrics(
+            tp, fp, fn)
+
+        _t_stop = time.time()
+        logging.debug(f"Validation time for 1 epoch : {_t_stop - _t_start} s")
+
+        recall_validation_factor = recall_validation
+        precision_validation_factor = precision_validation
+        updated_model = False
+        if f1_validation > best_model_f1_score_validation:
+            best_model = copy.deepcopy(net)
+            best_epoch = epoch
+            # torch.save(best_model.state_dict(), path_dataset / experiment_name, _use_new_zipfile_serialization=False)
+            if save_model:
+                torch.save({
+                    'epoch': epoch,
+                    'model_state_dict': best_model.state_dict(),
+                    'optimizer_state_dict': optimizer.state_dict(),
+                    'recall_validation_factor': recall_validation_factor,
+                    'precision_validation_factor': precision_validation_factor,
+                    'best_model_on_loss_loss_validation': best_model_on_loss_loss_validation,
+                    'best_model_f1_score_validation': best_model_f1_score_validation,
+                }, data_config['path_dataset'] / experiment_name, _use_new_zipfile_serialization=False)
+                updated_model = True
+            best_model_f1_score_validation = f1_validation
+            best_model_precision_validation = precision_validation
+            best_model_recall_validation = recall_validation
+            best_model_loss_validation = loss_validation
+            best_model_accuracy = accuracy_validation
+        if loss_validation < best_model_on_loss_loss_validation:
+            best_model = copy.deepcopy(net)
+            best_epoch = epoch
+            # torch.save(best_model.state_dict(), path_dataset / experiment_name, _use_new_zipfile_serialization=False)
+            if save_model:
+                torch.save({
+                    'epoch': epoch,
+                    'model_state_dict': best_model.state_dict(),
+                    'optimizer_state_dict': optimizer.state_dict(),
+                    'recall_validation_factor': recall_validation_factor,
+                    'precision_validation_factor': precision_validation_factor,
+                    'best_model_on_loss_loss_validation': best_model_on_loss_loss_validation,
+                    'best_model_f1_score_validation': best_model_f1_score_validation,
+                }, data_config['path_dataset'] / (experiment_name + "_on_loss"), _use_new_zipfile_serialization=False)
+                updated_model = True
+            best_model_on_loss_f1_score_validation = f1_validation
+            best_model_on_loss_precision_validation = precision_validation
+            best_model_on_loss_recall_validation = recall_validation
+            best_model_on_loss_loss_validation = loss_validation
+            best_model_on_loss_accuracy = accuracy_validation
+
+        loss_early_stopping = loss_validation if loss_early_stopping is None and early_stopping_smoothing_factor == 1 else loss_validation if loss_early_stopping is None else loss_validation * early_stopping_smoothing_factor + loss_early_stopping * (
+            1.0 - early_stopping_smoothing_factor)
+
+        if loss_early_stopping < best_loss_early_stopping:
+            best_loss_early_stopping = loss_early_stopping
+            early_stopping_counter = 0
+            best_epoch_early_stopping = epoch
+        else:
+            early_stopping_counter += 1
+
+        logger.log(accuracy_train=accuracy_train,
+                   loss_train=loss_train,
+                   accuracy_validation=accuracy_validation,
+                   loss_validation=loss_validation,
+                   f1_validation=f1_validation,
+                   precision_validation=precision_validation,
+                   recall_validation=recall_validation,
+                   best_epoch=best_epoch,
+                   best_model=best_model,
+                   loss_early_stopping=loss_early_stopping,
+                   best_epoch_early_stopping=best_epoch_early_stopping,
+                   best_model_accuracy_validation=best_model_accuracy,
+                   best_model_f1_score_validation=best_model_f1_score_validation,
+                   best_model_precision_validation=best_model_precision_validation,
+                   best_model_recall_validation=best_model_recall_validation,
+                   best_model_loss_validation=best_model_loss_validation,
+                   best_model_on_loss_accuracy_validation=best_model_on_loss_accuracy,
+                   best_model_on_loss_f1_score_validation=best_model_on_loss_f1_score_validation,
+                   best_model_on_loss_precision_validation=best_model_on_loss_precision_validation,
+                   best_model_on_loss_recall_validation=best_model_on_loss_recall_validation,
+                   best_model_on_loss_loss_validation=best_model_on_loss_loss_validation,
+                   updated_model=updated_model)
+
+        if early_stopping_counter > nb_epoch_early_stopping_stop or time.time() - _t_start > max_duration:
+            logging.debug("Early stopping.")
+            break
+    logging.debug("Delete logger")
+    del logger
+    logging.debug("Logger deleted")
+    return best_model_loss_validation, best_model_f1_score_validation, best_epoch_early_stopping
+
+
+def run_offline_unlabelled(nn_config, path_experiments, unlabelled_segment):
+    logging.debug(f"nn_config: {nn_config}")
+    experiment_name = nn_config['experiment_name']
+    window_size_s = nn_config["window_size_s"]
+    fe = nn_config["fe"]
+    seq_stride_s = nn_config["seq_stride_s"]
+    hidden_size = nn_config["hidden_size"]
+    device_inference = nn_config["device_inference"]
+    nb_rnn_layers = nn_config["nb_rnn_layers"]
+    classification = nn_config["classification"]
+    validation_network_stride = nn_config["validation_network_stride"]
+
+    window_size = int(window_size_s * fe)
+    seq_stride = int(seq_stride_s * fe)
+
+    if device_inference.startswith("cuda"):
+        assert torch.cuda.is_available(), "CUDA unavailable"
+
+    torch.seed()
+    net = PortiloopNetwork(nn_config).to(device=device_inference)
+
+    file_exp = experiment_name
+    file_exp += "" if classification else "_on_loss"
+    path_experiments = Path(path_experiments)
+    if not device_inference.startswith("cuda"):
+        checkpoint = torch.load(
+            path_experiments / file_exp, map_location=torch.device('cpu'))
+    else:
+        checkpoint = torch.load(path_experiments / file_exp)
+    logging.debug("Use checkpoint model")
+    net.load_state_dict(checkpoint['model_state_dict'])
+
+    test_loader, batch_size_test = generate_dataloader_unlabelled_offline(unlabelled_segment=unlabelled_segment,
+                                                                          window_size=window_size,
+                                                                          seq_stride=seq_stride,
+                                                                          network_stride=validation_network_stride)
+
+    output_total, true_idx_total = run_inference_unlabelled_offline(dataloader=test_loader,
+                                                                    net=net,
+                                                                    device=device_inference,
+                                                                    hidden_size=hidden_size,
+                                                                    nb_rnn_layers=nb_rnn_layers,
+                                                                    classification=classification,
+                                                                    batch_size_validation=batch_size_test)
+    return output_total, true_idx_total
+
+
+def initialize_nn_config(experiment_name):
+    nn_config = {
+        'experiment_name': experiment_name,
+        'device_train': 'cuda:0',
+        'device_val': 'cuda:0',
+        'nb_epoch_max': 11,
+        'max_duration': 257400,
+        'nb_epoch_early_stopping_stop': 10,
+        'early_stopping_smoothing_factor': 0.1,
+        'fe': 250,
+        'nb_batch_per_epoch': 5000,
+        'batch_size': 256,
+        'first_layer_dropout': False,
+        'power_features_input': False,
+        'dropout': 0.5,
+        'adam_w': 0.01,
+        'distribution_mode': 0,
+        'classification': True,
+        'nb_conv_layers': 3,
+        'seq_len': 50,
+        'nb_channel': 16,
+        'hidden_size': 32,
+        'seq_stride_s': 0.08600000000000001,
+        'nb_rnn_layers': 1,
+        'validation_network_stride': 1,
+        'reg_balancing': 'none',
+        'RNN': True,
+        'envelope_input': True,
+        'lr_adam': 0.0007,
+        'window_size_s': 0.266,
+        'stride_pool': 1,
+        'stride_conv': 1,
+        'kernel_conv': 9,
+        'kernel_pool': 7,
+        'dilation_conv': 1,
+        'dilation_pool': 1,
+        'nb_out': 24,
+        'time_in_past': 4.300000000000001,
+        'estimator_size_memory': 1628774400}
+    return nn_config
+
+
+def initialize_dataset_config(phase, path_dataset=None, reg_filename=None, class_filename=None, sl=None, sl_p1=None, sl_p2=None):
+    # Initialize with default filename
+    if path_dataset is None:
+        path_dataset = Path(__file__).absolute(
+        ).parent.parent.parent / 'dataset'
+
+    if reg_filename is None:
+        reg_filename = f"dataset_regression_{phase}_big_250_matlab_standardized_envelope_pf.txt"
+    if class_filename is None:
+        class_filename = f"dataset_classification_{phase}_big_250_matlab_standardized_envelope_pf.txt"
+    if sl is None:
+        sl = f"subject_sequence_{phase}_big.txt"
+    if sl_p1 is None:
+        sl_p1 = f"subject_sequence_p1_big.txt"
+    if sl_p2 is None:
+        sl_p2 = f"subject_sequence_p2_big.txt"
+
+    return {'path_dataset': path_dataset,
+            'filename_regression_dataset': reg_filename,
+            'filename_classification_dataset': class_filename,
+            'subject_list': sl,
+            'subject_list_p1': sl_p1,
+            'subject_list_p2': sl_p2}
+
+
+def initialize_exp_config(ablation=0, phase='full', test_set=False):
+    # Initialize a dictionary with all hyperparameters of the experiment
+    threshold_list = {'p1': 0.2, 'p2': 0.35, 'full': 0.2}  # full = p1 + p2
+    config = {
+        'ablation': ablation,  # 0 : no ablation, 1 : remove input 1, 2 : remove input 2
+        'phase': phase,
+        'threshold': threshold_list[phase],
+        'len_segment': 115,
+        'test': test_set
+    }
+    return config
+
+# Example to run on google colab: https://colab.research.google.com/drive/1jlpZ_ng9yXJYxl3Mqscr-82ephg5PSkw?usp=sharing
+
+
+if __name__ == "__main__":
+
+    # Parser definition
+    parser = ArgumentParser()
+    parser.add_argument('--dataset_path', type=str, default=None)
+    parser.add_argument('--experiment_name', type=str,
+                        help='Experiment name for Wandb')
+    parser.add_argument('--experiment_index', type=int,
+                        help='Experiment index for Wandb')
+    parser.add_argument('--output_file', type=str, default=None)
+    parser.add_argument('--phase', type=str, default='full')
+    parser.add_argument('--ablation', type=int, default=0)
+    parser.add_argument('--max_split', type=int, default=10)
+    parser.add_argument('--config_nn', type=str, default=None)
+    parser.add_argument('--config_data', type=str, default=None)
+    parser.add_argument(
+        '--no_test_set', dest='test_set', action='store_false', default=True)
+    parser.add_argument(
+        '--save_config', dest='save_config', action='store_true', default=False)
+    # Group for classification argument
+    feature_class_parser = parser.add_mutually_exclusive_group(required=False)
+    feature_class_parser.add_argument(
+        '--classification', dest='classification', action='store_true')
+    feature_class_parser.add_argument(
+        '--regression', dest='classification', action='store_false')
+    parser.set_defaults(classification=True)
+    args = parser.parse_args()
+
+    # Initialize configuration dictionary for dataset
+    if args.config_data is None:
+        data_config = initialize_dataset_config(
+            args.phase, path_dataset=Path(args.dataset_path) if args.dataset_path is not None else None)
+    else:
+        data_config = json.loads(args.config_data)
+
+    # initialize output file for logging
+    if args.output_file is not None:
+        logging.basicConfig(format='%(levelname)s: %(message)s',
+                            filename=args.output_file, level=logging.DEBUG)
+    else:
+        logging.basicConfig(
+            format='%(levelname)s: %(message)s', level=logging.DEBUG)
+
+    # Initialize configuration dictionary for NN
+    exp_index = args.experiment_index
+    possible_split = [0, 2]
+    split_idx = possible_split[exp_index % 2]
+
+    if args.config_nn is None:
+        # Option with some random hyperparameters
+        nn_config = initialize_nn_config(args.experiment_name)
+    else:
+        try:
+            # Read from json file
+            nn_config = json.loads(args.config_nn)
+        except Exception:
+            # REad from one of defaults
+
+            nn_config = get_nn_dict(
+                args.config_nn, args.ablation, exp_index, split_idx)
+    nn_config['split_idx'] = split_idx
+
+    # Set classification mode and name of experiment
+    nn_config['distribution_mode'] = 0 if args.classification else 1
+    nn_config['classification'] = args.classification
+    nn_config['experiment_name'] += "_regression" if not args.classification else ""
+    nn_config['experiment_name'] += "_no_test" if not args.test_set else ""
+
+    exp_config = initialize_exp_config(
+        ablation=args.ablation, phase=args.phase, test_set=args.test_set)
+
+    if args.save_config:
+        with open(f"{args.experiment_name}_nn_config.json", "w") as outfile:
+            json.dump(nn_config, outfile)
+
+    logging.debug(f"classification: {args.classification}")
+
+    seed()  # reset the seed
+
+    # Start the run
+    run(nn_config=nn_config, data_config=data_config, exp_config=exp_config, wandb_project=f"{args.phase}-dataset-public",
+        save_model=True, unique_name=False)
diff --git a/portiloop_software/portiloop_python/PMBO/pareto_network.py b/portiloop_software/portiloop_python/PMBO/pareto_network.py
index fd68777..83800e1 100644
--- a/portiloop_software/portiloop_python/PMBO/pareto_network.py
+++ b/portiloop_software/portiloop_python/PMBO/pareto_network.py
@@ -25,6 +25,7 @@
     PORT_WORKER, SOCKET_TIMEOUT_CONNECT_WORKER, ACK_TIMEOUT_WORKER_TO_SERVER, IP_SERVER, ACK_TIMEOUT_META_TO_SERVER, select_and_send_or_close_socket, poll_and_recv_or_close_socket, get_connected_socket, LOOP_SLEEP_TIME_META, LOOP_SLEEP_TIME_WORKER, LOOP_SLEEP_TIME, SEND_ALIVE
 from pareto_search import LoggerWandbPareto, RUN_NAME, SurrogateModel, META_MODEL_DEVICE, train_surrogate, update_pareto, nb_parameters, MAX_NB_PARAMETERS, NB_SAMPLED_MODELS_PER_ITERATION, exp_max_pareto_efficiency, run, \
     load_network_files, dump_network_files, transform_config_dict_to_input, WANDB_PROJECT_PARETO, PARETO_ID
+from portiloop_software.portiloop_python.ANN.training_experiment import initialize_dataset_config, initialize_exp_config
 from portiloop_software.portiloop_python.Utils.utils import same_config_dict, sample_config_dict, MIN_NB_PARAMETERS, MAXIMIZE_F1_SCORE, PROFILE_META
 
 
@@ -53,7 +54,8 @@ def __init__(self, server_ip=None):
         logging.debug(f"public IP: {self.public_ip}")
         logging.debug(f"server IP: {self.server_ip}")
 
-        Thread(target=self.__run_thread, args=(), kwargs={}, daemon=True).start()
+        Thread(target=self.__run_thread, args=(),
+               kwargs={}, daemon=True).start()
         self.run()
 
     def __run_thread(self):
@@ -65,13 +67,15 @@ def __run_thread(self):
             ack_time = time.time()
             recv_time = time.time()
             wait_ack = False
-            s = get_connected_socket(SOCKET_TIMEOUT_CONNECT_META, self.server_ip, PORT_META)
+            s = get_connected_socket(
+                SOCKET_TIMEOUT_CONNECT_META, self.server_ip, PORT_META)
             if s is None:
                 logging.debug("get_connected_socket failed in Meta thread")
                 continue
             while True:
                 # send weights
-                self.__to_launch_lock.acquire()  # WEIGHTS LOCK...........................................................
+                # WEIGHTS LOCK...........................................................
+                self.__to_launch_lock.acquire()
                 if len(self.__to_launch) > 0:  # new experiments to send
                     if not wait_ack:
                         obj = self.__to_launch.pop(0)
@@ -80,13 +84,16 @@ def __run_thread(self):
                             wait_ack = True
                         else:
                             self.__to_launch_lock.release()
-                            logging.debug("select_and_send_or_close_socket failed in Meta")
+                            logging.debug(
+                                "select_and_send_or_close_socket failed in Meta")
                             break
                     else:
                         elapsed = time.time() - ack_time
-                        logging.debug(f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
+                        logging.debug(
+                            f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
                         if elapsed >= ACK_TIMEOUT_META_TO_SERVER:
-                            logging.debug("INFO: ACK timed-out, breaking connection")
+                            logging.debug(
+                                "INFO: ACK timed-out, breaking connection")
                             self.__to_launch_lock.release()
                             break
                 else:
@@ -100,16 +107,20 @@ def __run_thread(self):
                                 wait_ack = True
                             else:
                                 self.__to_launch_lock.release()
-                                logging.debug("select_and_send_or_close_socket failed in Meta")
+                                logging.debug(
+                                    "select_and_send_or_close_socket failed in Meta")
                                 break
                         else:
                             elapsed = time.time() - ack_time
-                            logging.debug(f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
+                            logging.debug(
+                                f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
                             if elapsed >= ACK_TIMEOUT_META_TO_SERVER:
-                                logging.debug("INFO: ACK timed-out, breaking connection")
+                                logging.debug(
+                                    "INFO: ACK timed-out, breaking connection")
                                 self.__to_launch_lock.release()
                                 break
-                self.__to_launch_lock.release()  # END LOCK.......................................................
+                # END LOCK.......................................................
+                self.__to_launch_lock.release()
                 # checks for samples batch
                 success, obj = poll_and_recv_or_close_socket(s)
                 if not success:
@@ -118,18 +129,22 @@ def __run_thread(self):
                 elif obj is not None and obj != 'ACK':  # received finished
                     logging.debug(f"DEBUG INFO: Meta interface received obj")
                     recv_time = time.time()
-                    self.__results_lock.acquire()  # LOCK.........................................................
+                    # LOCK.........................................................
+                    self.__results_lock.acquire()
                     self.__results += obj
-                    self.__results_lock.release()  # END LOCK.....................................................
+                    # END LOCK.....................................................
+                    self.__results_lock.release()
                     self.__must_launch_lock.acquire()
                     self.__must_launch = True
                     self.__must_launch_lock.release()
                 elif obj == 'ACK':
                     recv_time = time.time()
                     wait_ack = False
-                    logging.debug(f"INFO: transfer acknowledgment received after {time.time() - ack_time}s")
+                    logging.debug(
+                        f"INFO: transfer acknowledgment received after {time.time() - ack_time}s")
                 elif time.time() - recv_time > self.recv_timeout:
-                    logging.debug(f"Timeout in Meta, not received anything for too long")
+                    logging.debug(
+                        f"Timeout in Meta, not received anything for too long")
                     break
                 time.sleep(LOOP_SLEEP_TIME_META)
             s.close()
@@ -154,7 +169,8 @@ def run(self):
             meta_model = SurrogateModel()
             meta_model.to(META_MODEL_DEVICE)
             meta_model.train()
-            meta_model, meta_loss = train_surrogate(meta_model, deepcopy(finished_experiments))
+            meta_model, meta_loss = train_surrogate(
+                meta_model, deepcopy(finished_experiments))
             logging.debug(f"surrogate model loss: {meta_loss}")
 
         # main meta-learning procedure:
@@ -176,7 +192,8 @@ def run(self):
                 self.__results_lock.release()
                 for res in temp_results:
                     if 'best_epoch' in res.keys():
-                        logging.debug(f"best epoch for the model received : {res['best_epoch']}")
+                        logging.debug(
+                            f"best epoch for the model received : {res['best_epoch']}")
                     to_remove = -1
                     to_update = -1
                     for i, exp in enumerate(launched_experiments):
@@ -191,27 +208,33 @@ def run(self):
                     if to_remove >= 0:
                         launched_experiments.pop(to_remove)
                     if to_update >= 0:
-                        finished_experiments[to_update]["software_cost"] = min(finished_experiments[to_update]["software_cost"], res["software_cost"])
-                        pareto_front = update_pareto(finished_experiments[to_update]["software_cost"], pareto_front)
+                        finished_experiments[to_update]["software_cost"] = min(
+                            finished_experiments[to_update]["software_cost"], res["software_cost"])
+                        pareto_front = update_pareto(
+                            finished_experiments[to_update]["software_cost"], pareto_front)
                     else:
                         pareto_front = update_pareto(res, pareto_front)
                         finished_experiments.append(res)
                     dump_network_files(finished_experiments, pareto_front)
                     prev_exp = res
-                if len(finished_experiments) > 0 and prev_exp != {}:  # train before sampling a new model
+                # train before sampling a new model
+                if len(finished_experiments) > 0 and prev_exp != {}:
                     logging.debug("training new surrogate model...")
 
                     meta_model = SurrogateModel()
                     meta_model.to(META_MODEL_DEVICE)
 
                     meta_model.train()
-                    meta_model, meta_loss = train_surrogate(meta_model, deepcopy(finished_experiments))
+                    meta_model, meta_loss = train_surrogate(
+                        meta_model, deepcopy(finished_experiments))
 
                     logging.debug(f"surrogate model loss: {meta_loss}")
 
-                    logger.log(surrogate_loss=meta_loss, surprise=prev_exp["surprise"], all_experiments=finished_experiments, pareto_front=pareto_front)
+                    logger.log(surrogate_loss=meta_loss,
+                               surprise=prev_exp["surprise"], all_experiments=finished_experiments, pareto_front=pareto_front)
 
-                num_experiment = len(finished_experiments) + len(launched_experiments)
+                num_experiment = len(finished_experiments) + \
+                    len(launched_experiments)
                 logging.debug("---")
                 logging.debug(f"ITERATION N° {num_experiment}")
 
@@ -224,7 +247,8 @@ def run(self):
                     exp = {}
 
                     # sample model
-                    config_dict, unrounded = sample_config_dict(name=RUN_NAME + "_" + str(num_experiment), previous_exp=prev_exp, all_exp=finished_experiments + launched_experiments + exps)
+                    config_dict, unrounded = sample_config_dict(name=RUN_NAME + "_" + str(
+                        num_experiment), previous_exp=prev_exp, all_exp=finished_experiments + launched_experiments + exps)
 
                     nb_params = nb_parameters(config_dict)
                     if nb_params > MAX_NB_PARAMETERS or nb_params < MIN_NB_PARAMETERS:
@@ -244,7 +268,8 @@ def run(self):
                     if len(exps) >= NB_SAMPLED_MODELS_PER_ITERATION:
                         # select model
                         model_selected = True
-                        exp = exp_max_pareto_efficiency(exps, pareto_front, finished_experiments)
+                        exp = exp_max_pareto_efficiency(
+                            exps, pareto_front, finished_experiments)
 
                 logging.debug(f"config: {exp['config_dict']}")
                 logging.debug(f"nb parameters: {exp['cost_hardware']}")
@@ -269,7 +294,7 @@ def run(self):
 
 
 class Worker:
-    def __init__(self, server_ip=None):
+    def __init__(self, data_config, server_ip=None):
 
         self.public_ip = get('http://api.ipify.org').text
         self.local_ip = socket.gethostbyname(socket.gethostname())
@@ -281,11 +306,15 @@ def __init__(self, server_ip=None):
         self.__exp_to_run = None
         self.__exp_to_run_lock = Lock()
 
+        self.data_config = data_config
+        self.exp_config = initialize_exp_config()
+
         logging.debug(f"local IP: {self.local_ip}")
         logging.debug(f"public IP: {self.public_ip}")
         logging.debug(f"server IP: {self.server_ip}")
 
-        Thread(target=self.__run_thread, args=(), kwargs={}, daemon=True).start()
+        Thread(target=self.__run_thread, args=(),
+               kwargs={}, daemon=True).start()
         self.run()
 
     def __run_thread(self):
@@ -297,13 +326,15 @@ def __run_thread(self):
             ack_time = time.time()
             recv_time = time.time()
             wait_ack = False
-            s = get_connected_socket(SOCKET_TIMEOUT_CONNECT_WORKER, self.server_ip, PORT_WORKER)
+            s = get_connected_socket(
+                SOCKET_TIMEOUT_CONNECT_WORKER, self.server_ip, PORT_WORKER)
             if s is None:
                 logging.debug("get_connected_socket failed in worker")
                 continue
             while True:
                 # send buffer
-                self.__finished_exp_lock.acquire()  # BUFFER LOCK.............................................................
+                # BUFFER LOCK.............................................................
+                self.__finished_exp_lock.acquire()
                 if self.__finished_exp is not None:  # a new result is available
                     logging.debug("new result available")
                     if not wait_ack:
@@ -313,14 +344,17 @@ def __run_thread(self):
                             wait_ack = True
                         else:
                             self.__finished_exp_lock.release()
-                            logging.debug("select_and_send_or_close_socket failed in worker")
+                            logging.debug(
+                                "select_and_send_or_close_socket failed in worker")
                             break
                         self.__finished_exp = None
                     else:
                         elapsed = time.time() - ack_time
-                        logging.debug(f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
+                        logging.debug(
+                            f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
                         if elapsed >= ACK_TIMEOUT_WORKER_TO_SERVER:
-                            logging.debug("INFO: ACK timed-out, breaking connection")
+                            logging.debug(
+                                "INFO: ACK timed-out, breaking connection")
                             self.__finished_exp_lock.release()
                             break
                 else:
@@ -334,16 +368,20 @@ def __run_thread(self):
                                 wait_ack = True
                             else:
                                 self.__finished_exp_lock.release()
-                                logging.debug("select_and_send_or_close_socket failed in Meta")
+                                logging.debug(
+                                    "select_and_send_or_close_socket failed in Meta")
                                 break
                         else:
                             elapsed = time.time() - ack_time
-                            logging.debug(f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
+                            logging.debug(
+                                f"WARNING: object ready but ACK from last transmission not received. Elapsed:{elapsed}s")
                             if elapsed >= ACK_TIMEOUT_META_TO_SERVER:
-                                logging.debug("INFO: ACK timed-out, breaking connection")
+                                logging.debug(
+                                    "INFO: ACK timed-out, breaking connection")
                                 self.__finished_exp_lock.release()
                                 break
-                self.__finished_exp_lock.release()  # END BUFFER LOCK.........................................................
+                # END BUFFER LOCK.........................................................
+                self.__finished_exp_lock.release()
                 # checks for new experiments to launch
                 success, obj = poll_and_recv_or_close_socket(s)
                 if not success:
@@ -352,15 +390,19 @@ def __run_thread(self):
                 elif obj is not None and obj != 'ACK':
                     logging.debug(f"DEBUG INFO: worker received obj")
                     recv_time = time.time()
-                    self.__exp_to_run_lock.acquire()  # LOCK.......................................................
+                    # LOCK.......................................................
+                    self.__exp_to_run_lock.acquire()
                     self.__exp_to_run = obj
-                    self.__exp_to_run_lock.release()  # END LOCK...................................................
+                    # END LOCK...................................................
+                    self.__exp_to_run_lock.release()
                 elif obj == 'ACK':
                     recv_time = time.time()
                     wait_ack = False
-                    logging.debug(f"INFO: transfer acknowledgment received after {time.time() - ack_time}s")
+                    logging.debug(
+                        f"INFO: transfer acknowledgment received after {time.time() - ack_time}s")
                 elif time.time() - recv_time > self.recv_timeout:
-                    logging.debug(f"Timeout in worker, not received anything for too long")
+                    logging.debug(
+                        f"Timeout in worker, not received anything for too long")
                     break
                 time.sleep(LOOP_SLEEP_TIME_WORKER)
             s.close()
@@ -373,10 +415,14 @@ def run(self):
                 self.__exp_to_run = None
                 self.__exp_to_run_lock.release()
                 predicted_loss = exp['cost_software']
+
+                # TODO: Get a data config dict and a exp dict
                 logging.debug("Launch run")
-                best_loss, best_f1_score, exp["best_epoch"] = run(exp["config_dict"], f"{WANDB_PROJECT_PARETO}_runs_{PARETO_ID}", save_model=False, unique_name=True)
+                best_loss, best_f1_score, exp["best_epoch"] = run(
+                    exp["config_dict"], self.data_config, self.exp_config, f"{WANDB_PROJECT_PARETO}_runs_{PARETO_ID}", save_model=False, unique_name=True)
                 logging.debug("Run finished")
-                exp["cost_software"] = 1 - best_f1_score if MAXIMIZE_F1_SCORE else best_loss
+                exp["cost_software"] = 1 - \
+                    best_f1_score if MAXIMIZE_F1_SCORE else best_loss
                 exp['surprise'] = exp["cost_software"] - predicted_loss
                 self.__finished_exp_lock.acquire()
                 logging.debug("Before copying exp result")
@@ -388,12 +434,12 @@ def run(self):
             time.sleep(LOOP_SLEEP_TIME)
 
 
-def main(args):
+def main(args, data_config=None):
     if args.server:
         logging.debug("INFO: now running: server")
         Server()
     elif args.worker:
-        Worker(server_ip=args.ip_server)
+        Worker(data_config, server_ip=args.ip_server)
         logging.debug("INFO: now running: worker")
     elif args.meta:
         MetaLearner(server_ip=args.ip_server)
@@ -412,9 +458,18 @@ def main(args):
     parser.add_argument('--worker', action='store_true')
     parser.add_argument('--output_file', type=str, default=None)
     parser.add_argument('--ip_server', type=str, default=IP_SERVER)
+    parser.add_argument('--dataset_path', type=str, default=None)
+
     args = parser.parse_args()
     if args.output_file is not None:
-        logging.basicConfig(format='%(asctime)s %(levelname)s: %(message)s', filename=args.output_file, level=logging.DEBUG)
+        logging.basicConfig(format='%(asctime)s %(levelname)s: %(message)s',
+                            filename=args.output_file, level=logging.DEBUG)
     else:
-        logging.basicConfig(format='%(asctime)s %(levelname)s: %(message)s', level=logging.DEBUG)
-    main(args)
+        logging.basicConfig(
+            format='%(asctime)s %(levelname)s: %(message)s', level=logging.DEBUG)
+
+    if args.worker:
+        dataset_config = initialize_dataset_config(
+            dataset_path=args.dataset_path)
+
+    main(args, data_config=dataset_config)
diff --git a/portiloop_software/portiloop_python/PMBO/pareto_search.py b/portiloop_software/portiloop_python/PMBO/pareto_search.py
index 2ee75ed..e023d0a 100644
--- a/portiloop_software/portiloop_python/PMBO/pareto_search.py
+++ b/portiloop_software/portiloop_python/PMBO/pareto_search.py
@@ -20,7 +20,7 @@
 import wandb
 
 # all constants (no hyperparameters here!)
-from portiloop_software.portiloop_python.ANN.portiloop_detector_training import PortiloopNetwork, run
+from portiloop_software.portiloop_python.ANN.training_experiment import PortiloopNetwork, initialize_exp_config, run, initialize_dataset_config
 from portiloop_software.portiloop_python.Utils.utils import EPSILON_EXP_NOISE, MAX_NB_PARAMETERS, MIN_NB_PARAMETERS, sample_config_dict, MAXIMIZE_F1_SCORE
 
 THRESHOLD = 0.2
@@ -42,13 +42,18 @@
 PARETO_ID = "tests"
 RUN_NAME = f"pareto_search_{PARETO_ID}"
 
-NB_SAMPLED_MODELS_PER_ITERATION = 200  # number of models sampled per iteration, only the best predicted one is selected
+# number of models sampled per iteration, only the best predicted one is selected
+NB_SAMPLED_MODELS_PER_ITERATION = 200
 
-DEFAULT_META_EPOCHS = 100  # default number of meta-epochs before entering meta train/val training regime
-START_META_TRAIN_VAL_AFTER = 100  # minimum number of experiments in the dataset before using a validation set
+# default number of meta-epochs before entering meta train/val training regime
+DEFAULT_META_EPOCHS = 100
+# minimum number of experiments in the dataset before using a validation set
+START_META_TRAIN_VAL_AFTER = 100
 META_TRAIN_VAL_RATIO = 0.8  # portion of experiments in meta training sets
-MAX_META_EPOCHS = 500  # surrogate training will stop after this number of meta-training epochs if the model doesn't converge
-META_EARLY_STOPPING = 30  # meta early stopping after this number of unsuccessful meta epochs
+# surrogate training will stop after this number of meta-training epochs if the model doesn't converge
+MAX_META_EPOCHS = 500
+# meta early stopping after this number of unsuccessful meta epochs
+META_EARLY_STOPPING = 30
 
 
 class MetaDataset(Dataset):
@@ -60,7 +65,8 @@ def __len__(self):
         return len(self.data)
 
     def __getitem__(self, idx):
-        assert 0 <= idx <= len(self), f"Index out of range ({idx}/{len(self)})."
+        assert 0 <= idx <= len(
+            self), f"Index out of range ({idx}/{len(self)})."
         config_dict = self.data[idx]["config_dict"]
         x = transform_config_dict_to_input(config_dict)
         label = torch.tensor(self.data[idx]["cost_software"])
@@ -150,45 +156,52 @@ def dominates_pareto(experiment, pareto):
 
 
 def transform_config_dict_to_input(config_dict):
-    x = [#float(config_dict["seq_len"]),  # idk why, but needed
-         float(config_dict["nb_channel"]),
-         config_dict["hidden_size"],
-         int(config_dict["seq_stride_s"] * config_dict["fe"]),
-         config_dict["nb_rnn_layers"],
-         int(config_dict["window_size_s"] * config_dict["fe"]),
-         config_dict["nb_conv_layers"],
-         #config_dict["stride_pool"],
-         #config_dict["stride_conv"],
-         config_dict["kernel_conv"],
-         config_dict["kernel_pool"],
-         #config_dict["dilation_conv"],
-         #config_dict["dilation_pool"],
-         #int(config_dict['RNN']),
-         #int(config_dict['envelope_input']),
-         config_dict["lr_adam"],
-         config_dict["batch_size"]]
+    x = [  # float(config_dict["seq_len"]),  # idk why, but needed
+        float(config_dict["nb_channel"]),
+        config_dict["hidden_size"],
+        int(config_dict["seq_stride_s"] * config_dict["fe"]),
+        config_dict["nb_rnn_layers"],
+        int(config_dict["window_size_s"] * config_dict["fe"]),
+        config_dict["nb_conv_layers"],
+        # config_dict["stride_pool"],
+        # config_dict["stride_conv"],
+        config_dict["kernel_conv"],
+        config_dict["kernel_pool"],
+        # config_dict["dilation_conv"],
+        # config_dict["dilation_pool"],
+        # int(config_dict['RNN']),
+        # int(config_dict['envelope_input']),
+        config_dict["lr_adam"],
+        config_dict["batch_size"]]
     x = torch.tensor(x)
     return x
 
 
 def train_surrogate(net, all_experiments):
-    optimizer = torch.optim.SGD(net.parameters(), lr=0.05, momentum=0, dampening=0, weight_decay=0.01, nesterov=False)
+    optimizer = torch.optim.SGD(net.parameters(
+    ), lr=0.05, momentum=0, dampening=0, weight_decay=0.01, nesterov=False)
     criterion = nn.MSELoss()
     best_val_loss = np.inf
     best_model = None
     early_stopping_counter = 0
     random.shuffle(all_experiments)
-    max_epoch = MAX_META_EPOCHS if len(all_experiments) > START_META_TRAIN_VAL_AFTER else len(all_experiments)
+    max_epoch = MAX_META_EPOCHS if len(
+        all_experiments) > START_META_TRAIN_VAL_AFTER else len(all_experiments)
 
     for epoch in range(max_epoch):
         if len(all_experiments) > START_META_TRAIN_VAL_AFTER:
-            train_dataset = MetaDataset(all_experiments, start=0, end=META_TRAIN_VAL_RATIO)
-            validation_dataset = MetaDataset(all_experiments, start=META_TRAIN_VAL_RATIO, end=1)
-            train_loader = DataLoader(train_dataset, batch_size=1, shuffle=True, pin_memory=True, num_workers=0)
-            validation_loader = DataLoader(validation_dataset, batch_size=1, shuffle=True, pin_memory=True, num_workers=0)
+            train_dataset = MetaDataset(
+                all_experiments, start=0, end=META_TRAIN_VAL_RATIO)
+            validation_dataset = MetaDataset(
+                all_experiments, start=META_TRAIN_VAL_RATIO, end=1)
+            train_loader = DataLoader(
+                train_dataset, batch_size=1, shuffle=True, pin_memory=True, num_workers=0)
+            validation_loader = DataLoader(
+                validation_dataset, batch_size=1, shuffle=True, pin_memory=True, num_workers=0)
         else:
             train_dataset = MetaDataset(all_experiments, start=0, end=1)
-            train_loader = DataLoader(train_dataset, batch_size=1, shuffle=True, pin_memory=True, num_workers=0)
+            train_loader = DataLoader(
+                train_dataset, batch_size=1, shuffle=True, pin_memory=True, num_workers=0)
         losses = []
 
         net.train()
@@ -215,8 +228,10 @@ def train_surrogate(net, all_experiments):
             with torch.no_grad():
                 for batch_data in validation_loader:
                     batch_samples, batch_labels = batch_data
-                    batch_samples = batch_samples.to(device=META_MODEL_DEVICE).float()
-                    batch_labels = batch_labels.to(device=META_MODEL_DEVICE).float()
+                    batch_samples = batch_samples.to(
+                        device=META_MODEL_DEVICE).float()
+                    batch_labels = batch_labels.to(
+                        device=META_MODEL_DEVICE).float()
 
                     output = net(batch_samples)
                     output = output.view(-1)
@@ -235,10 +250,12 @@ def train_surrogate(net, all_experiments):
                 if early_stopping_counter >= META_EARLY_STOPPING:
                     net = best_model
                     mean_loss = best_val_loss
-                    logging.debug(f"DEBUG: meta training converged at epoch:{epoch} (-{META_EARLY_STOPPING})")
+                    logging.debug(
+                        f"DEBUG: meta training converged at epoch:{epoch} (-{META_EARLY_STOPPING})")
                     break
                 elif epoch == MAX_META_EPOCHS - 1:
-                    logging.debug(f"DEBUG: meta training did not converge after epoch:{epoch}")
+                    logging.debug(
+                        f"DEBUG: meta training did not converge after epoch:{epoch}")
                     break
     net.eval()
     return net, mean_loss
@@ -255,7 +272,8 @@ def wandb_plot_pareto(all_experiments, ordered_pareto_front):
     y_axis = [exp["cost_software"] for exp in ordered_pareto_front]
     plt.plot(x_axis, y_axis, 'ro-')
     # last dot
-    plt.plot(all_experiments[-1]["cost_hardware"], all_experiments[-1]["cost_software"], 'go')
+    plt.plot(all_experiments[-1]["cost_hardware"],
+             all_experiments[-1]["cost_software"], 'go')
 
     plt.xlabel(f"nb parameters")
     plt.ylabel(f"validation cost")
@@ -326,12 +344,14 @@ def pareto_efficiency(experiment, all_experiments):
 
 def exp_max_pareto_efficiency(experiments, pareto_front, all_experiments):
     assert len(experiments) >= 1
-    noise = random.choices(population=[True, False], weights=[EPSILON_EXP_NOISE, 1.0 - EPSILON_EXP_NOISE])[0]
+    noise = random.choices(population=[True, False], weights=[
+                           EPSILON_EXP_NOISE, 1.0 - EPSILON_EXP_NOISE])[0]
     if noise or len(pareto_front) == 0:
         return random.choice(experiments)
     else:
         assert len(all_experiments) != 0
-        histo = np.histogram([exp["cost_hardware"] for exp in all_experiments], bins=100, density=True, range=(0, MAX_NB_PARAMETERS))
+        histo = np.histogram([exp["cost_hardware"] for exp in all_experiments],
+                             bins=100, density=True, range=(0, MAX_NB_PARAMETERS))
 
         max_efficiency = -np.inf
         best_exp = None
@@ -347,7 +367,8 @@ def exp_max_pareto_efficiency(experiments, pareto_front, all_experiments):
                 best_efficiency = efficiency + nerf
                 best_nerf = nerf
         assert best_exp is not None
-        logging.debug(f"DEBUG: selected {best_exp['cost_hardware']}: efficiency:{best_efficiency}, nerf:{best_nerf}")
+        logging.debug(
+            f"DEBUG: selected {best_exp['cost_hardware']}: efficiency:{best_efficiency}, nerf:{best_nerf}")
         return best_exp
 
 
@@ -419,7 +440,8 @@ class LoggerWandbPareto:
     def __init__(self, run_name):
         self.run_name = run_name
         os.environ['WANDB_API_KEY'] = "cd105554ccdfeee0bbe69c175ba0c14ed41f6e00"
-        self.wandb_run = wandb.init(project=WANDB_PROJECT_PARETO, entity="portiloop", id=run_name, resume="allow", reinit=True)
+        self.wandb_run = wandb.init(
+            project=WANDB_PROJECT_PARETO, entity="portiloop", id=run_name, resume="allow", reinit=True)
 
     def log(self,
             surrogate_loss,
@@ -438,7 +460,7 @@ def __del__(self):
         self.wandb_run.finish()
 
 
-def iterative_training_local():
+def iterative_training_local(data_config, exp_config):
     logger = LoggerWandbPareto(RUN_NAME)
 
     all_experiments, pareto_front = load_network_files()
@@ -455,7 +477,8 @@ def iterative_training_local():
         meta_model = SurrogateModel()
         meta_model.to(META_MODEL_DEVICE)
         meta_model.train()
-        meta_model, meta_loss = train_surrogate(meta_model, deepcopy(all_experiments))
+        meta_model, meta_loss = train_surrogate(
+            meta_model, deepcopy(all_experiments))
         logging.debug(f"surrogate model loss: {meta_loss}")
 
     # main meta-learning procedure:
@@ -475,7 +498,8 @@ def iterative_training_local():
             exp = {}
 
             # sample model
-            config_dict, unrounded = sample_config_dict(name=RUN_NAME + "_" + str(num_experiment), previous_exp=prev_exp, all_exp=all_experiments)
+            config_dict, unrounded = sample_config_dict(
+                name=RUN_NAME + "_" + str(num_experiment), previous_exp=prev_exp, all_exp=all_experiments)
 
             nb_params = nb_parameters(config_dict)
             if nb_params > MAX_NB_PARAMETERS or nb_params < MIN_NB_PARAMETERS:
@@ -496,7 +520,8 @@ def iterative_training_local():
             if len(exps) >= NB_SAMPLED_MODELS_PER_ITERATION:
                 # select model
                 model_selected = True
-                exp = exp_max_pareto_efficiency(exps, pareto_front, all_experiments)
+                exp = exp_max_pareto_efficiency(
+                    exps, pareto_front, all_experiments)
 
         config_dict = exp["config_dict"]
         predicted_cost = exp["cost_software"]
@@ -507,8 +532,11 @@ def iterative_training_local():
         logging.debug(f"nb parameters: {nb_params}")
         logging.debug(f"predicted cost: {predicted_cost}")
         logging.debug("training...")
-        best_loss, best_f1_score, exp["best_epoch"] = run(exp["config_dict"], f"{WANDB_PROJECT_PARETO}_runs_{PARETO_ID}", save_model=False, unique_name=True)
-        exp["cost_software"] = 1 - best_f1_score if MAXIMIZE_F1_SCORE else best_loss
+        # TODO: Get the dataconfig and the experiment config
+        best_loss, best_f1_score, exp["best_epoch"] = run(
+            exp["config_dict"], data_config, exp_config, f"{WANDB_PROJECT_PARETO}_runs_{PARETO_ID}", save_model=False, unique_name=True)
+        exp["cost_software"] = 1 - \
+            best_f1_score if MAXIMIZE_F1_SCORE else best_loss
 
         pareto_front = update_pareto(exp, pareto_front)
         all_experiments.append(exp)
@@ -525,12 +553,14 @@ def iterative_training_local():
         meta_model.to(META_MODEL_DEVICE)
 
         meta_model.train()
-        meta_model, meta_loss = train_surrogate(meta_model, deepcopy(all_experiments))
+        meta_model, meta_loss = train_surrogate(
+            meta_model, deepcopy(all_experiments))
 
         logging.debug(f"surrogate model loss: {meta_loss}")
 
         dump_network_files(all_experiments, pareto_front)
-        logger.log(surrogate_loss=meta_loss, surprise=surprise, all_experiments=all_experiments, pareto_front=pareto_front)
+        logger.log(surrogate_loss=meta_loss, surprise=surprise,
+                   all_experiments=all_experiments, pareto_front=pareto_front)
 
     logging.debug(f"End of meta-training.")
 
@@ -539,11 +569,19 @@ def iterative_training_local():
 
 if __name__ == "__main__":
     parser = ArgumentParser()
+    parser.add_argument('--dataset_path', type=str, default=None)
     parser.add_argument('--output_file', type=str, default=None)
     args = parser.parse_args()
+
+    data_config = initialize_dataset_config(
+        args.phase, path_dataset=Path(args.dataset_path) if args.dataset_path is not None else None)
+    exp_config = initialize_exp_config()
+
     if args.output_file is not None:
-        logging.basicConfig(format='%(levelname)s: %(message)s', filename=args.output_file, level=logging.DEBUG)
+        logging.basicConfig(format='%(levelname)s: %(message)s',
+                            filename=args.output_file, level=logging.DEBUG)
     else:
-        logging.basicConfig(format='%(levelname)s: %(message)s', level=logging.DEBUG)
+        logging.basicConfig(
+            format='%(levelname)s: %(message)s', level=logging.DEBUG)
 
-    iterative_training_local()
+    iterative_training_local(data_config, exp_config)