* Add AEDRNNNetwork
* minor fix
* minor
* minor refactoring
* add _* to private methods
* precommit
* minor fix
* minor
* minor
* minor
* minor
* minor
* Add dilation_rate_decoder kwarg
* add kwargs
* pre-commit
* minor
* temporal_latent_space
* Adjust for temporal_latent_space
* Add docstring
* Add test cases for AEDRNNNetwork
* Add skipif for pytest tests
* minor
* minor fix
* minor
* minor
* minor
* Add tests
* minor
* add tag
* minor
* fix bugs
* update base
* minor
* minor
* Add AEDRNNClusterer
* typo
* add to __init__
* minor:
* modelcheckpoint callback fixes
* minor fixes
* fixes
* Add AEDRNNClusterer example notebook
* docstring
* fixes
* Update _ae_drnn.py
* Fixes for reviews
* fixes
* Automatic `pre-commit` fixes
* update network
* Add estimator kwarg in clusterer
* minor fixes
* some fixes
* fix notebooks
* remove deprecated
* Delete examples/clustering/deep_clustering.ipynb
* Add metrics kwarg
* remove return_X_y
* Update _ae_drnn.py
* Automatic `pre-commit` fixes

---------

Co-authored-by: aadya940 <[email protected]>
Showing 2 changed files with 357 additions and 0 deletions.
@@ -0,0 +1,355 @@
"""Deep Learning Auto-Encoder using DRNN Network.""" | ||
|
||
__maintainer__ = [] | ||
__all__ = ["AEDRNNClusterer"] | ||
|
||
import gc | ||
import os | ||
import time | ||
from copy import deepcopy | ||
|
||
from sklearn.utils import check_random_state | ||
|
||
from aeon.clustering import DummyClusterer | ||
from aeon.clustering.deep_learning.base import BaseDeepClusterer | ||
from aeon.networks import AEDRNNNetwork | ||
from aeon.utils.validation._dependencies import _check_soft_dependencies | ||
|
||
if _check_soft_dependencies(["tensorflow"], severity="none"): | ||
from aeon.networks._ae_drnn import _TensorDilation | ||
|
||
|
||
class AEDRNNClusterer(BaseDeepClusterer):
    """Auto-Encoder based Dilated Recurrent Neural Network (DRNN).

    Parameters
    ----------
    n_clusters : int, default=None
        Number of clusters for the deep learning model.
    clustering_algorithm : str, default="deprecated"
        Deprecated, please use the 'estimator' parameter.
    estimator : aeon clusterer, default=None
        An aeon estimator to be built using the transformed data.
        Defaults to aeon TimeSeriesKMeans() with euclidean distance,
        mean averaging method and n_clusters set to 2.
    clustering_params : dict, default=None
        Deprecated, please use the 'estimator' parameter.
    latent_space_dim : int, default=128
        Dimension of the latent space of the auto-encoder.
    temporal_latent_space : bool, default=False
        Flag to choose whether the latent space is a multivariate time
        series (MTS) or a Euclidean space.
    n_layers_encoder : int, default=3
        Number of layers in the encoder.
    n_layers_decoder : int, default=3
        Number of layers in the decoder.
    dilation_rate_encoder : int or list of int, default=1
        The dilation rate for the encoder.
    dilation_rate_decoder : int or list of int, default=1
        The dilation rate for the decoder.
    activation_encoder : str or list of str, default="relu"
        Activation used after each DRNN layer in the encoder.
    activation_decoder : str or list of str, default="relu"
        Activation used after each DRNN layer in the decoder.
    n_units_encoder : list of int or int, default=None
        Number of units in each DRNN layer of the encoder.
    n_units_decoder : list of int or int, default=None
        Number of units in each DRNN layer of the decoder.
    n_epochs : int, default=2000
        The number of epochs to train the model.
    batch_size : int, default=32
        The number of samples per gradient update.
    use_mini_batch_size : bool, default=False
        Whether or not to use the mini batch size formula.
    random_state : int, RandomState instance or None, default=None
        If `int`, random_state is the seed used by the random number generator;
        If `RandomState` instance, random_state is the random number generator;
        If `None`, the random number generator is the `RandomState` instance used
        by `np.random`.
        Seeded random number generation can only be guaranteed on CPU processing;
        GPU processing will be non-deterministic.
    verbose : bool, default=False
        Whether to output extra information.
    loss : str, default="mse"
        Fit parameter for the keras model.
    metrics : str or list of str, default=None
        Metrics for the keras model; set to ["mean_squared_error"] if None.
    optimizer : keras.optimizers object or str, default="Adam"
        The optimizer to be used; if None, Adam with its default
        learning rate is used.
    file_path : str, default="./"
        File path to save the best model.
    save_best_model : bool, default=False
        Whether or not to save the best model. The ModelCheckpoint
        callback is used by default; if this flag is True, the best
        saved model is not automatically deleted from file and the
        user can choose the file name.
    save_last_model : bool, default=False
        Whether or not to save the model from the last epoch trained,
        using the base class method save_last_model_to_file.
    best_file_name : str, default="best_model"
        The name of the file of the best model; if save_best_model is
        set to False, this parameter is discarded.
    last_file_name : str, default="last_file"
        The name of the file of the last model; if save_last_model is
        set to False, this parameter is discarded.
    callbacks : keras.callbacks, default=None
        List of keras callbacks.

    Examples
    --------
    >>> from aeon.clustering.deep_learning import AEDRNNClusterer
    >>> from aeon.clustering import DummyClusterer
    >>> from aeon.datasets import load_unit_test
    >>> X_train, y_train = load_unit_test(split="train")
    >>> X_test, y_test = load_unit_test(split="test")
    >>> _clst = DummyClusterer(n_clusters=2)
    >>> aedrnn = AEDRNNClusterer(estimator=_clst,
    ...                          n_epochs=20, batch_size=4)  # doctest: +SKIP
    >>> aedrnn.fit(X_train)  # doctest: +SKIP
    AEDRNNClusterer(...)
    """
    def __init__(
        self,
        n_clusters=None,
        estimator=None,
        clustering_algorithm="deprecated",
        clustering_params=None,
        latent_space_dim=128,
        temporal_latent_space=False,
        n_layers_encoder=3,
        n_layers_decoder=3,
        dilation_rate_encoder=1,
        dilation_rate_decoder=1,
        n_units_encoder=None,
        n_units_decoder=None,
        activation_encoder="relu",
        activation_decoder="relu",
        n_epochs=2000,
        batch_size=32,
        use_mini_batch_size=False,
        random_state=None,
        verbose=False,
        loss="mse",
        metrics=None,
        optimizer="Adam",
        file_path="./",
        save_best_model=False,
        save_last_model=False,
        best_file_name="best_model",
        last_file_name="last_file",
        callbacks=None,
    ):
        self.latent_space_dim = latent_space_dim
        self.temporal_latent_space = temporal_latent_space
        self.n_layers_encoder = n_layers_encoder
        self.n_layers_decoder = n_layers_decoder
        self.activation_encoder = activation_encoder
        self.activation_decoder = activation_decoder
        self.dilation_rate_encoder = dilation_rate_encoder
        self.dilation_rate_decoder = dilation_rate_decoder
        self.n_units_encoder = n_units_encoder
        self.n_units_decoder = n_units_decoder
        self.optimizer = optimizer
        self.loss = loss
        self.metrics = metrics
        self.verbose = verbose
        self.use_mini_batch_size = use_mini_batch_size
        self.callbacks = callbacks
        self.file_path = file_path
        self.n_epochs = n_epochs
        self.save_best_model = save_best_model
        self.save_last_model = save_last_model
        self.best_file_name = best_file_name
        self.random_state = random_state

        super().__init__(
            n_clusters=n_clusters,
            estimator=estimator,
            clustering_algorithm=clustering_algorithm,
            clustering_params=clustering_params,
            batch_size=batch_size,
            last_file_name=last_file_name,
        )

        self._network = AEDRNNNetwork(
            latent_space_dim=self.latent_space_dim,
            temporal_latent_space=self.temporal_latent_space,
            n_layers_encoder=self.n_layers_encoder,
            n_layers_decoder=self.n_layers_decoder,
            dilation_rate_encoder=self.dilation_rate_encoder,
            dilation_rate_decoder=self.dilation_rate_decoder,
            activation_encoder=self.activation_encoder,
            activation_decoder=self.activation_decoder,
            n_units_encoder=self.n_units_encoder,
            n_units_decoder=self.n_units_decoder,
        )

    def build_model(self, input_shape, **kwargs):
        """Construct a compiled, un-trained, keras model that is ready for training.

        In aeon, time series are stored in numpy arrays of shape
        (n_channels, n_timepoints). Keras/tensorflow assume data is in shape
        (n_timepoints, n_channels). This method also assumes
        (n_timepoints, n_channels); the transpose should happen in fit.

        Parameters
        ----------
        input_shape : tuple
            The shape of the data fed into the input layer, should be
            (n_timepoints, n_channels).

        Returns
        -------
        output : a compiled Keras Model.
        """
        import numpy as np
        import tensorflow as tf

        # Derive a fixed integer seed from random_state so keras weight
        # initialisation is reproducible (on CPU; see class docstring).
        rng = check_random_state(self.random_state)
        self.random_state_ = rng.randint(0, np.iinfo(np.int32).max)
        tf.keras.utils.set_random_seed(self.random_state_)
        encoder, decoder = self._network.build_network(input_shape, **kwargs)

        # Chain encoder and decoder, reshaping the reconstruction back to the
        # input shape so the model trains as an auto-encoder.
        input_layer = tf.keras.layers.Input(input_shape, name="input layer")
        encoder_output = encoder(input_layer)
        decoder_output = decoder(encoder_output)
        output_layer = tf.keras.layers.Reshape(
            target_shape=input_shape, name="outputlayer"
        )(decoder_output)

        model = tf.keras.models.Model(inputs=input_layer, outputs=output_layer)

        self.optimizer_ = (
            tf.keras.optimizers.Adam() if self.optimizer is None else self.optimizer
        )

        if self.metrics is None:
            self._metrics = ["mean_squared_error"]
        elif isinstance(self.metrics, list):
            self._metrics = self.metrics
        elif isinstance(self.metrics, str):
            self._metrics = [self.metrics]
        else:
            raise ValueError("Metrics should be a list, string, or None.")

        model.compile(optimizer=self.optimizer_, loss=self.loss, metrics=self._metrics)

        return model
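
    # A minimal sketch of calling build_model directly (tensorflow required;
    # the shape and variable names below are illustrative): the input tuple
    # follows the (n_timepoints, n_channels) convention documented above.
    #
    #   clst = AEDRNNClusterer()
    #   model = clst.build_model((24, 2))
    #   model.summary()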

    def _fit(self, X):
        """Fit the clusterer on the training set X.

        Parameters
        ----------
        X : np.ndarray of shape (n_cases, n_channels, n_timepoints)
            The training input samples.

        Returns
        -------
        self : object
        """
        import tensorflow as tf

        # Transpose to conform to Keras input style.
        X = X.transpose(0, 2, 1)

        self.input_shape = X.shape[1:]
        self.training_model_ = self.build_model(self.input_shape)

        if self.verbose:
            self.training_model_.summary()

        # The mini batch size formula caps the batch size at one tenth of the
        # number of training cases.
        if self.use_mini_batch_size:
            mini_batch_size = min(self.batch_size, X.shape[0] // 10)
        else:
            mini_batch_size = self.batch_size

        self.file_name_ = (
            self.best_file_name if self.save_best_model else str(time.time_ns())
        )

        if self.callbacks is None:
            self.callbacks_ = [
                tf.keras.callbacks.ReduceLROnPlateau(
                    monitor="loss", factor=0.5, patience=50, min_lr=0.0001
                ),
                tf.keras.callbacks.ModelCheckpoint(
                    filepath=self.file_path + self.file_name_ + ".keras",
                    monitor="loss",
                    save_best_only=True,
                ),
            ]
        else:
            self.callbacks_ = self._get_model_checkpoint_callback(
                callbacks=self.callbacks,
                file_path=self.file_path,
                file_name=self.file_name_,
            )

        # The auto-encoder is trained to reconstruct its input, so X is both
        # the input and the target.
        self.history = self.training_model_.fit(
            X,
            X,
            batch_size=mini_batch_size,
            epochs=self.n_epochs,
            verbose=self.verbose,
            callbacks=self.callbacks_,
        )

        # Reload the best model written by the ModelCheckpoint callback; fall
        # back to the final training model if no checkpoint was saved.
        try:
            self.model_ = tf.keras.models.load_model(
                self.file_path + self.file_name_ + ".keras",
                compile=False,
                custom_objects={"_TensorDilation": _TensorDilation},
            )
            if not self.save_best_model:
                os.remove(self.file_path + self.file_name_ + ".keras")
        except FileNotFoundError:
            self.model_ = deepcopy(self.training_model_)

        self._fit_clustering(X=X)

        gc.collect()

        return self
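
    # A post-fit sketch (illustrative, not from this commit): the keras History
    # object stored on self.history in _fit above exposes the per-epoch
    # reconstruction loss, e.g.
    #
    #   clst.fit(X)
    #   clst.history.history["loss"]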

    def _score(self, X, y=None):
        # Transpose to conform to Keras input style.
        X = X.transpose(0, 2, 1)
        # layers[1] is the encoder sub-model; score the wrapped estimator on
        # the latent representation.
        latent_space = self.model_.layers[1].predict(X)
        return self._estimator.score(latent_space)

    @classmethod
    def _get_test_params(cls, parameter_set="default"):
        """Return testing parameter settings for the estimator.

        Parameters
        ----------
        parameter_set : str, default="default"
            Name of the set of test parameters to return, for use in tests. If no
            special parameters are defined for a value, will return the `"default"`
            set. For classifiers, a "default" set of parameters should be provided
            for general testing, and a "results_comparison" set for comparing
            against previously recorded results if the general set does not produce
            suitable probabilities to compare against.

        Returns
        -------
        params : dict or list of dict, default={}
            Parameters to create testing instances of the class.
            Each dict is a set of parameters to construct an "interesting" test
            instance, i.e., `MyClass(**params)` or `MyClass(**params[i])` creates
            a valid test instance.
            `create_test_instance` uses the first (or only) dictionary in `params`.
        """
        param1 = {
            "estimator": DummyClusterer(n_clusters=2),
            "n_epochs": 1,
            "batch_size": 4,
            "n_layers_encoder": 1,
            "n_layers_decoder": 1,
        }

        return [param1]
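
A minimal end-to-end sketch of the new clusterer (illustrative: the random data, parameter values, and variable names are assumptions, not part of this commit; tensorflow must be installed):

import numpy as np

from aeon.clustering import DummyClusterer
from aeon.clustering.deep_learning import AEDRNNClusterer

# 20 cases, 2 channels, 50 timepoints, in aeon's (n_cases, n_channels, n_timepoints) layout.
X = np.random.default_rng(0).normal(size=(20, 2, 50))

clst = AEDRNNClusterer(
    estimator=DummyClusterer(n_clusters=2),
    n_epochs=2,
    batch_size=4,
)
clst.fit(X)
labels = clst.predict(X)  # cluster assignment for each case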