Source code for dtaianomaly.data.UCRLoader


import numpy as np
from dtaianomaly.data.data import LazyDataLoader, DataSet


[docs] class UCRLoader(LazyDataLoader): """ Lazy dataloader for the UCR suite of anomaly detection data sets. This implementation expects the file names to contain the start and stop time stamps of the single anomaly in the time series as: '\*_start_stop.txt'. Parameters ---------- path: str Path to a single UCR data set. """ def load(self) -> DataSet: # Load time series X = np.loadtxt(self.path) # Load anomaly targets (0 is background, 1 is anomaly) # UCR datasets specify the anomaly in dataset name name = self.path.split('_') onset = int(name[-2]) offset = int(''.join(filter(str.isdigit, name[-1]))) # To ensure the file extensions gets ignored y = np.zeros(shape=X.shape, dtype=np.int8) y[onset:offset] = 1 return DataSet(x=X, y=y)