Source code for dtaianomaly.preprocessing.MinMaxScaler

from typing import Optional, Tuple

import numpy as np
from sklearn.exceptions import NotFittedError

from dtaianomaly.preprocessing.Preprocessor import Preprocessor


[docs] class MinMaxScaler(Preprocessor): """ Rescale raw time series to a [0, 1] via min-max scaling. The minimum and maximum is computed on a training set, after which these values can be used to transform a new time series. Therefore, there is no guarantee that the values of the transformed test set will actually be in the range [0, 1]. For multivariate time series, each attribute will be normalized independently, i.e., the minimum and maximum of each attribute in the transformed time series will 0 and 1, respectively. If the minimum and maximum of an attribute is the same (the time series consists of only one value), then the transformation will not do anything. Attributes ---------- min_: array-like of shape (n_attributes) The minimum value in each attribute of the training data. max_: array-like of shape (n_attributes) The maximum value in each attribute of the training data. Raises ------ NotFittedError If the `transform` method is called before fitting this MinMaxScaler. """ min_: np.array max_: np.array def _fit(self, X: np.ndarray, y: Optional[np.ndarray] = None) -> "MinMaxScaler": if len(X.shape) == 1 or X.shape[1] == 1: # univariate case self.min_ = np.array([np.nanmin(X)]) self.max_ = np.array([np.nanmax(X)]) else: # multivariate case self.min_ = np.nanmin(X, axis=0) self.max_ = np.nanmax(X, axis=0) # Adjust to deal with constant attributes constant_attributes = self.min_ == self.max_ self.min_ = np.where(constant_attributes, 0, self.min_) self.max_ = np.where(constant_attributes, 1, self.max_) return self def _transform( self, X: np.ndarray, y: Optional[np.ndarray] = None ) -> Tuple[np.ndarray, Optional[np.ndarray]]: if not (hasattr(self, "min_") and hasattr(self, "max_")): raise NotFittedError(f"Call `fit` before using transform on {str(self)}") if not ( (len(X.shape) == 1 and self.min_.shape[0] == 1) or X.shape[1] == self.min_.shape[0] ): raise AttributeError( f"Trying to min max scale a time series with {X.shape[0]} attributes while it was fitted on {self.min_.shape[0]} attributes!" ) X_ = (X - self.min_) / (self.max_ - self.min_) return X_, y