From 6ca5bcd9588153c5cf0e9b1adf16fa06c914e91c Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 14 Jun 2024 12:21:29 +0300 Subject: [PATCH 01/43] metrics started --- fedot_ind/core/models/early_tc/metrics.py | 122 ++++++++++++++++++++++ fedot_ind/core/models/early_tc/teaser.py | 0 2 files changed, 122 insertions(+) create mode 100644 fedot_ind/core/models/early_tc/metrics.py create mode 100644 fedot_ind/core/models/early_tc/teaser.py diff --git a/fedot_ind/core/models/early_tc/metrics.py b/fedot_ind/core/models/early_tc/metrics.py new file mode 100644 index 000000000..a4cb9cef5 --- /dev/null +++ b/fedot_ind/core/models/early_tc/metrics.py @@ -0,0 +1,122 @@ +from sklearn.metrics import confusion_matrix +import numpy as np +import pandas as pd +from fedot.core.data.data import InputData, OutputData +from typing import Tuple, List, Optional, Union, Literal + +def conf_matrix(actual, predicted): + cm = confusion_matrix(actual, predicted) + return dict(TN=cm[0, 0], FP=cm[0, 1], FN=cm[1, 0], TP=[1, 1]) + +def average_delay(boundaries, prediction, + point, + use_idx=True, + window_placement='lefter'): + cp_confusion = extract_cp_cm(boundaries, prediction, use_idx=use_idx, use_switch_point=False) + # statistics + statistics = { + 'anomalies_num': len(cp_confusion['TPs']) + len(cp_confusion['FPs']), + 'FP_num': len(cp_confusion['FPs']), + 'missed': len(cp_confusion['FNs']) + } + time_func = { + 'righter': lambda triplet: triplet[1] - triplet[0], + 'lefter': lambda triplet: triplet[2] - triplet[1], + 'central': lambda triplet: triplet[1] - triplet[0] - (triplet[2] - triplet[0]) / 2 + }[window_placement] + + detection_history = { + i: time_func(triplet) for i, triplet in cp_confusion['TPs'].items() + } + return detection_history, statistics + + + +def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], + prediction: pd.DataFrame, + use_switch_point: bool = True, # if first anomaly dot is considered as changepoint + use_idx: bool = False): + if isinstance(boundaries, 
pd.DataFrame): + boundaries = boundaries.values.T + anomaly_tsp = prediction[prediction == 1].sort_index().index + TPs, FNs, FPs = {}, [], [] + + if boundaries.shape[1]: + + FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest + for i, (b_low, b_up) in enumerate(boundaries): + all_tsp_in_window = prediction[b_low: b_up].index + anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp + if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? + FNs.append(i if use_idx else all_tsp_in_window) + TPs[i] = [b_low, anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, b_up] + if not use_idx: + FNs.append(all_tsp_in_window - anomaly_tsp_in_window) + FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest + else: + FPs.append(anomaly_tsp) + + FPs = np.concatenate(FPs) + FNs = np.concatenate(FNs) + + return dict( + FP=FPs, + FN=FNs, + TP=TPs + ) + + +# cognate of single_detecting_boundaries +def get_boundaries(idx, actual_timestamps, window_size:int = None, + window_placement: Literal['left', 'right', 'central'] = 'left', + intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', + ): + # idx = idx + # cast everything to pandas object fir the subsequent comfort + if isinstance(idx, np.array): + if idx.dtype == np.dtype('O'): + idx = pd.to_datetime(pd.Series(idx)) + td = pd.Timedelta(window_size) + else: + idx = pd.Series(idx) + td = window_size + else: + raise TypeError('Unexpected type of ts index') + + boundaries = np.tile(actual_timestamps, (2, 1)) + # [0, ...] - lower bound, [1, ...] 
- upper + if window_placement == 'left': + boundaries[0] -= td + elif window_placement == 'central': + boundaries[0] -= td / 2 + boundaries[1] += td / 2 + elif window_placement == 'right': + boundaries[1] += td + else: + raise ValueError('Unknown mode') + + if not len(actual_timestamps): + return boundaries + + # intersection resolution + for i in range(len(actual_timestamps) - 1): + if not boundaries[0, i + 1] > boundaries[1, i]: + continue + + if intersection_mode == 'shift_to_left': + boundaries[0, i + 1] = boundaries[1, i] + elif intersection_mode == 'shift_to_right': + boundaries[1, i] = boundaries[0, i + 1] + elif intersection_mode == 'uniform': + boundaries[1, i], boundaries[0, i + 1] = boundaries[0, i + 1], boundaries[1, i] + else: + raise ValueError('Unknown intersection resolution') + + # filtering + idx_to_keep = np.abs(np.diff(boundaries, axis=0)) > 1e-6 + boundaries = boundaries[..., idx_to_keep] + boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) + return boundaries + + + diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py new file mode 100644 index 000000000..e69de29bb From e69fcd4ba6baa10dd02585333a052badf15f8a39 Mon Sep 17 00:00:00 2001 From: leostre Date: Thu, 20 Jun 2024 13:17:30 +0300 Subject: [PATCH 02/43] metrics ended --- fedot_ind/core/models/early_tc/metrics.py | 26 ++++++++++++++++++----- 1 file changed, 21 insertions(+), 5 deletions(-) diff --git a/fedot_ind/core/models/early_tc/metrics.py b/fedot_ind/core/models/early_tc/metrics.py index a4cb9cef5..f4a5f6544 100644 --- a/fedot_ind/core/models/early_tc/metrics.py +++ b/fedot_ind/core/models/early_tc/metrics.py @@ -30,7 +30,8 @@ def average_delay(boundaries, prediction, } return detection_history, statistics - +def tp_transform(tps): + return np.diff(tps[[1, 0]], axis=0) / np.diff(tps[[-1, 0]], axis=0) def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], prediction: pd.DataFrame, @@ -49,7 +50,9 @@ def 
extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? FNs.append(i if use_idx else all_tsp_in_window) - TPs[i] = [b_low, anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, b_up] + TPs[i] = [b_low, + anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, + b_up] if not use_idx: FNs.append(all_tsp_in_window - anomaly_tsp_in_window) FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest @@ -62,10 +65,9 @@ def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], return dict( FP=FPs, FN=FNs, - TP=TPs + TP=np.stack(TPs) ) - # cognate of single_detecting_boundaries def get_boundaries(idx, actual_timestamps, window_size:int = None, window_placement: Literal['left', 'right', 'central'] = 'left', @@ -118,5 +120,19 @@ def get_boundaries(idx, actual_timestamps, window_size:int = None, boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) return boundaries - +def nab(boundaries, predictions, mode='standard', custom_coefs=None): + inner_coefs = { + 'low_FP': [1.0, -0.11, -1.0], + 'standard': [1., -0.22, -1.], + 'lof_FN': [1., -0.11, -2.] 
+ } + coefs = custom_coefs or inner_coefs[mode] + confusion_matrix = extract_cp_cm(boundaries, predictions) + + tps = confusion_matrix['tps'] + + score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], + coefs) + return score + From bc4064df91209922c9c39bc5c46f2db7d6cb4b09 Mon Sep 17 00:00:00 2001 From: leostre Date: Mon, 24 Jun 2024 03:05:51 +0300 Subject: [PATCH 03/43] in basis teaser is completed, need some make-up and add cut ts support --- fedot_ind/core/metrics/interval_metrics.py | 138 +++++++++++++++++++++ fedot_ind/core/models/early_tc/teaser.py | 123 ++++++++++++++++++ 2 files changed, 261 insertions(+) create mode 100644 fedot_ind/core/metrics/interval_metrics.py diff --git a/fedot_ind/core/metrics/interval_metrics.py b/fedot_ind/core/metrics/interval_metrics.py new file mode 100644 index 000000000..f4a5f6544 --- /dev/null +++ b/fedot_ind/core/metrics/interval_metrics.py @@ -0,0 +1,138 @@ +from sklearn.metrics import confusion_matrix +import numpy as np +import pandas as pd +from fedot.core.data.data import InputData, OutputData +from typing import Tuple, List, Optional, Union, Literal + +def conf_matrix(actual, predicted): + cm = confusion_matrix(actual, predicted) + return dict(TN=cm[0, 0], FP=cm[0, 1], FN=cm[1, 0], TP=[1, 1]) + +def average_delay(boundaries, prediction, + point, + use_idx=True, + window_placement='lefter'): + cp_confusion = extract_cp_cm(boundaries, prediction, use_idx=use_idx, use_switch_point=False) + # statistics + statistics = { + 'anomalies_num': len(cp_confusion['TPs']) + len(cp_confusion['FPs']), + 'FP_num': len(cp_confusion['FPs']), + 'missed': len(cp_confusion['FNs']) + } + time_func = { + 'righter': lambda triplet: triplet[1] - triplet[0], + 'lefter': lambda triplet: triplet[2] - triplet[1], + 'central': lambda triplet: triplet[1] - triplet[0] - (triplet[2] - triplet[0]) / 2 + }[window_placement] + + detection_history = { + i: time_func(triplet) for i, triplet in cp_confusion['TPs'].items() + } + 
return detection_history, statistics + +def tp_transform(tps): + return np.diff(tps[[1, 0]], axis=0) / np.diff(tps[[-1, 0]], axis=0) + +def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], + prediction: pd.DataFrame, + use_switch_point: bool = True, # if first anomaly dot is considered as changepoint + use_idx: bool = False): + if isinstance(boundaries, pd.DataFrame): + boundaries = boundaries.values.T + anomaly_tsp = prediction[prediction == 1].sort_index().index + TPs, FNs, FPs = {}, [], [] + + if boundaries.shape[1]: + + FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest + for i, (b_low, b_up) in enumerate(boundaries): + all_tsp_in_window = prediction[b_low: b_up].index + anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp + if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? + FNs.append(i if use_idx else all_tsp_in_window) + TPs[i] = [b_low, + anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, + b_up] + if not use_idx: + FNs.append(all_tsp_in_window - anomaly_tsp_in_window) + FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest + else: + FPs.append(anomaly_tsp) + + FPs = np.concatenate(FPs) + FNs = np.concatenate(FNs) + + return dict( + FP=FPs, + FN=FNs, + TP=np.stack(TPs) + ) + +# cognate of single_detecting_boundaries +def get_boundaries(idx, actual_timestamps, window_size:int = None, + window_placement: Literal['left', 'right', 'central'] = 'left', + intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', + ): + # idx = idx + # cast everything to pandas object fir the subsequent comfort + if isinstance(idx, np.array): + if idx.dtype == np.dtype('O'): + idx = pd.to_datetime(pd.Series(idx)) + td = pd.Timedelta(window_size) + else: + idx = pd.Series(idx) + td = window_size + else: + raise TypeError('Unexpected type of ts index') + + boundaries = np.tile(actual_timestamps, (2, 1)) + # [0, 
...] - lower bound, [1, ...] - upper + if window_placement == 'left': + boundaries[0] -= td + elif window_placement == 'central': + boundaries[0] -= td / 2 + boundaries[1] += td / 2 + elif window_placement == 'right': + boundaries[1] += td + else: + raise ValueError('Unknown mode') + + if not len(actual_timestamps): + return boundaries + + # intersection resolution + for i in range(len(actual_timestamps) - 1): + if not boundaries[0, i + 1] > boundaries[1, i]: + continue + + if intersection_mode == 'shift_to_left': + boundaries[0, i + 1] = boundaries[1, i] + elif intersection_mode == 'shift_to_right': + boundaries[1, i] = boundaries[0, i + 1] + elif intersection_mode == 'uniform': + boundaries[1, i], boundaries[0, i + 1] = boundaries[0, i + 1], boundaries[1, i] + else: + raise ValueError('Unknown intersection resolution') + + # filtering + idx_to_keep = np.abs(np.diff(boundaries, axis=0)) > 1e-6 + boundaries = boundaries[..., idx_to_keep] + boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) + return boundaries + +def nab(boundaries, predictions, mode='standard', custom_coefs=None): + inner_coefs = { + 'low_FP': [1.0, -0.11, -1.0], + 'standard': [1., -0.22, -1.], + 'lof_FN': [1., -0.11, -2.] 
+ } + coefs = custom_coefs or inner_coefs[mode] + confusion_matrix = extract_cp_cm(boundaries, predictions) + + tps = confusion_matrix['tps'] + + score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], + coefs) + return score + + diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index e69de29bb..66dc88745 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -0,0 +1,123 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters + + +class TEASER(ModelImplementation): + def __init__(self, params: Optional[OperationParameters] = None): + super().__init__() + if params is None: + params = {} + self.interval_length = params.get('interval_length', 10) # rewrite as interval_length + self.acceptance_threshold = params.get('acceptance_threshold', 5) + self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) + assert self.acceptance_threshold < self.interval_length, 'Not enough checkpoints for prediction proof' + # how to pass into ? % what needed + self.oc_svm_params = {} + self.weasel_params = {} + self.random_state = None # is needed? 
+ + def _init_model(self, max_data_length): + self.prediction_idx = self._compute_prediction_points(max_data_length) + self.n_pred = len(self.prediction_idx) + self.oc_estimators = [OneClassSVM(**self.oc_svm_params) for _ in range(self.n_pred)] + self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] + self.scalers = [StandardScaler() for _ in range(self.n_pred)] # do we need them separate? no inverse path expected + + def fit(self, input_data: InputData): + input_data = self.__convert_pd(input_data) + X, y = input_data.features, input_data.target # what's passed in case of classification to training? + self._init_model(max_data_length=X.shape[-1]) + for i in range(self.n_pred): + self._fit_one_interval(X, y, i) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i]] # what's dimensionality of input? will it work in case of multivariate? + X_part = self.scalers[i].fit_transform(X_part) + probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + filtered_probas = self._filter_positive(probas, y) # + X_oc = self._form_X_oc(filtered_probas) + self.oc_estimators[i].fit(X_oc, y) + + def _predict_one_slave(self, X, i): + X_part = X[..., :self.prediction_idx[i]] + X_part = self.scalers[i].transform(X_part) + probas = self.slave_estimators[i].predict_proba(X_part) + X_oc = self._form_X_oc(probas) + return X_oc, np.argmax(probas, axis=-1) + + def _compute_prediction_points(self, n_idx): + """Computes indices for prediction, includes last index, first interval may be greater""" + prediction_idx = np.arange(n_idx - 1, -1, -self.interval_length)[::-1] + self.earliness = 1 - prediction_idx / n_idx + return prediction_idx + + def _filter_positive(self, predicted_probas, y): # different logic in sktime + predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() + return predicted_probas[predicted_labels == y] + + def _form_X_oc(self, 
predicted_probas): + d = (predicted_probas.max() - predicted_probas) + d[d == 0] = 1 + d = d.min(axis=-1).reshape(-1, 1) + return np.hstack([predicted_probas, d]) + + def _predict(self, X): + n = X.shape[0] + self.states = np.ones((n, self.n_pred, 2)) # num_consec, class + X_ocs, predicted_labels = zip( + *[self._predict_one_slave(X, i) for i in range(self.n_pred)] + ) + non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold + to_oc_check = np.argwhere(non_acceptance) + X_ocs = np.stack(X_ocs) + predicted_labels = np.stack(predicted_labels) + # for each point of estimation + for i in range(self.n_pred): + # find not accepted points + ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] + X_to_ith = X_ocs[i][ith_point_to_oc] + # if they are not outliers + final_verdict = self.oc_estimators[i].predict(X_to_ith) # 1 for accept -1 for reject + # mark as accepted + non_acceptance[i, np.argwhere(final_verdict == 1).flatten()] = False + predicted_labels[non_acceptance] = -1 + return predicted_labels + + def _consecutive_count(self, predicted_labels: List[np.array]): + n = len(predicted_labels[0]) + consecutive_labels = np.ones((self.n_pred, n)) + for i in range(1, self.n_pred): + equal = predicted_labels[i - 1] == predicted_labels[i] + consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 + return consecutive_labels # n_pred x n_instances + + def __convert_pd(self, input_data): + if hasattr(input_data.features, 'values'): + input_data.features = input_data.features.values + if hasattr(input_data.target, 'values'): + input_data.target = input_data.target.values + return input_data + + def predict(self, input_data: InputData) -> OutputData: + input_data = self.__convert_pd(input_data) + prediction = self._predict(input_data.features) + return self._convert_to_output(input_data, predict=prediction) + + def predict_for_fit(self, input_data: InputData) -> OutputData: + return self.predict(input_data) + + def _score(self, X, y, 
hm_shift_to_acc=None): + hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc + predictions = self._predict(X) + accuracies = (predictions == np.tile(y, (1, self.n_pred))).sum(axis=1) / len(y) + return (1 + hm_shift_to_acc) * accuracies * self.earliness / (hm_shift_to_acc * accuracies + self.earliness) + + def _tune_oc(self): + #TODO + pass From 6500db70edcb3f068ff1c2d292258ab89ab4767b Mon Sep 17 00:00:00 2001 From: leostre Date: Wed, 26 Jun 2024 17:09:09 +0300 Subject: [PATCH 04/43] teaser inherits sklearn's classifier mixin now --- fedot_ind/core/models/early_tc/__init__.py | 0 fedot_ind/core/models/early_tc/teaser.py | 61 +++++++++++++------ .../data/default_operation_params.json | 37 +++++------ .../data/industrial_model_repository.json | 11 ++++ fedot_ind/core/repository/model_repository.py | 5 +- fedot_ind/core/tuning/search_space.py | 24 ++++++++ tests/unit/core/models/test_teaser.py | 35 +++++++++++ 7 files changed, 130 insertions(+), 43 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/__init__.py create mode 100644 tests/unit/core/models/test_teaser.py diff --git a/fedot_ind/core/models/early_tc/__init__.py b/fedot_ind/core/models/early_tc/__init__.py new file mode 100644 index 000000000..e69de29bb diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 66dc88745..66a031fd4 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -3,6 +3,7 @@ from fedot.core.data.data import InputData, OutputData from sklearn.svm import OneClassSVM from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV from sktime.classification.dictionary_based import MUSE, WEASEL from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters @@ -13,21 +14,25 @@ def __init__(self, params: 
Optional[OperationParameters] = None): super().__init__() if params is None: params = {} + self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') self.interval_length = params.get('interval_length', 10) # rewrite as interval_length self.acceptance_threshold = params.get('acceptance_threshold', 5) self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) assert self.acceptance_threshold < self.interval_length, 'Not enough checkpoints for prediction proof' + # how to pass into ? % what needed - self.oc_svm_params = {} + self._oc_svm_params = [100, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1.5, 1] self.weasel_params = {} self.random_state = None # is needed? def _init_model(self, max_data_length): self.prediction_idx = self._compute_prediction_points(max_data_length) self.n_pred = len(self.prediction_idx) - self.oc_estimators = [OneClassSVM(**self.oc_svm_params) for _ in range(self.n_pred)] + self.oc_estimators = [None] * self.n_pred self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] - self.scalers = [StandardScaler() for _ in range(self.n_pred)] # do we need them separate? no inverse path expected + self.scalers = [StandardScaler() for _ in range(self.n_pred)] + self.__offset = max_data_length % self.interval_length + self.best_estimator_idx = -1 def fit(self, input_data: InputData): input_data = self.__convert_pd(input_data) @@ -35,17 +40,22 @@ def fit(self, input_data: InputData): self._init_model(max_data_length=X.shape[-1]) for i in range(self.n_pred): self._fit_one_interval(X, y, i) + self.best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i]] # what's dimensionality of input? will it work in case of multivariate? + X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
X_part = self.scalers[i].fit_transform(X_part) probas = self.slave_estimators[i].fit_predict_proba(X_part, y) - filtered_probas = self._filter_positive(probas, y) # + filtered_probas = self._filter_trues(probas, y) # X_oc = self._form_X_oc(filtered_probas) - self.oc_estimators[i].fit(X_oc, y) + self.oc_estimators[i] = GridSearchCV(OneClassSVM(), + param_grid={"gamma": self._oc_svm_params}, + scoring='accuracy', + cv=min(X.shape[0], 10) + ).fit(X_oc, np.ones((len(X_oc), 1))).best_estimator_ - def _predict_one_slave(self, X, i): - X_part = X[..., :self.prediction_idx[i]] + def _predict_one_slave(self, X, i, offset=0): + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] X_part = self.scalers[i].transform(X_part) probas = self.slave_estimators[i].predict_proba(X_part) X_oc = self._form_X_oc(probas) @@ -57,7 +67,7 @@ def _compute_prediction_points(self, n_idx): self.earliness = 1 - prediction_idx / n_idx return prediction_idx - def _filter_positive(self, predicted_probas, y): # different logic in sktime + def _filter_trues(self, predicted_probas, y): # different logic in sktime predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() return predicted_probas[predicted_labels == y] @@ -70,15 +80,20 @@ def _form_X_oc(self, predicted_probas): def _predict(self, X): n = X.shape[0] self.states = np.ones((n, self.n_pred, 2)) # num_consec, class + if self.prediction_mode == 'best_by_harmonic_mean': + estimator_indices = [self.best_estimator_idx] + else: + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = list(range(last_idx + 1)) X_ocs, predicted_labels = zip( - *[self._predict_one_slave(X, i) for i in range(self.n_pred)] + *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold to_oc_check = np.argwhere(non_acceptance) X_ocs = np.stack(X_ocs) predicted_labels = np.stack(predicted_labels) # for each point 
of estimation - for i in range(self.n_pred): + for i in range(predicted_labels.shape[0]): # find not accepted points ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] X_to_ith = X_ocs[i][ith_point_to_oc] @@ -87,15 +102,16 @@ def _predict(self, X): # mark as accepted non_acceptance[i, np.argwhere(final_verdict == 1).flatten()] = False predicted_labels[non_acceptance] = -1 - return predicted_labels + return predicted_labels # prediction_points x n_instances def _consecutive_count(self, predicted_labels: List[np.array]): n = len(predicted_labels[0]) - consecutive_labels = np.ones((self.n_pred, n)) - for i in range(1, self.n_pred): + prediction_points = len(predicted_labels) + consecutive_labels = np.ones((prediction_points, n)) + for i in range(1, prediction_points): equal = predicted_labels[i - 1] == predicted_labels[i] consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 - return consecutive_labels # n_pred x n_instances + return consecutive_labels # prediction_points x n_instances def __convert_pd(self, input_data): if hasattr(input_data.features, 'values'): @@ -115,9 +131,14 @@ def predict_for_fit(self, input_data: InputData) -> OutputData: def _score(self, X, y, hm_shift_to_acc=None): hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc predictions = self._predict(X) - accuracies = (predictions == np.tile(y, (1, self.n_pred))).sum(axis=1) / len(y) - return (1 + hm_shift_to_acc) * accuracies * self.earliness / (hm_shift_to_acc * accuracies + self.earliness) + prediction_points = predictions.shape[0] + accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) + return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) - def _tune_oc(self): - #TODO - pass + def _get_applicable_index(self, last_available_idx): + idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') + if idx == 0: + raise 
RuntimeError('Too few points for prediction!') + idx -= 1 + offset = last_available_idx - self.prediction_idx[idx] + return idx, offset diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index ac513600e..1bbcc8614 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -31,6 +31,10 @@ "activation": "Softmax", "num_classes": 1 }, + "deepar_model": { + "epochs": 100, + "batch_size": 16 + }, "inception_model": { "epochs": 100, "batch_size": 32, @@ -43,6 +47,11 @@ "activation": "Softmax", "model_name": "ResNet18" }, + "tcn_model": { + "epochs": 100, + "batch_size": 32, + "activation": "ReLU" + }, "ssa_forecaster": { "window_size_method": "hac", "history_lookback": 30 @@ -121,6 +130,11 @@ "min_samples_leaf": 10, "bootstrap": false }, + "teaser": { + "interval_length": 10, + "acceptance_threshold": 3, + "hm_shift_to_acc": 2 + }, "dt": { "max_depth": 5, "min_samples_split": 10, @@ -344,27 +358,6 @@ "timeout": 10, "with_tuning": true }, -<<<<<<< HEAD - "minirocket_extractor": { - "num_features": 10000 - }, - "chronos_extractor": { - "num_features": 10000 - }, - "inception_model": { - "epochs": 100, - "batch_size": 32 - }, - "omniscale_model": { - "epochs": 100, - "batch_size": 32 - }, - "deepar_model": { - "epochs": 100, - "batch_size": 16 - }, -======= ->>>>>>> c5c358ba8f9b87b626014d2da9b2135c82684258 "tst_model": { "epochs": 100, "batch_size": 32 @@ -402,4 +395,4 @@ "max_homology_dimension": 1, "metric": "euclidean" } -} \ No newline at end of file +} diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 3f5c0a10f..8fb12f6de 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -617,6 +617,17 @@ "non_linear" ] }, 
+ "teaser": { + "meta": "ts_model", + "presets": ["fast_train", "ts"], + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.ts]" + }, "xgboost": { "meta": "sklearn_class", "presets": ["*tree"], diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index 69e47be3d..a984cbd38 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -44,6 +44,7 @@ from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor from xgboost import XGBRegressor +from fedot_ind.core.models.early_tc.teaser import TEASER from fedot_ind.core.models.manifold.riemann_embeding import RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR @@ -132,7 +133,9 @@ class AtomizedModel(Enum): # solo nn models 'mlp': MLPClassifier, # external models - 'lgbm': LGBMClassifier + 'lgbm': LGBMClassifier, + # Early classification + 'teaser': TEASER } FEDOT_PREPROC_MODEL = { # data standartization diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 82e798059..37849840d 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -60,6 +60,30 @@ 'selection_strategy': {'hyperopt-dist': hp.choice, 'sampling-scope': [['sum', 'pairwise']]} }, + 'teaser': + {'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'acceptance_threshold': {'hyperopt-dist': hp.choice, + 'sampling_scope': [[1, 2, 3, 4, 5]]}, + 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, + 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + }, + 'deepar_model': + {'epochs': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[x for x in range(10, 100, 10)]]}, + 'batch_size': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[x for x in range(8, 
64, 6)]]}, + 'dropout': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(0, 0.6, 0.1))]}, + 'rnn_layers':{'hyperopt-dist': hp.choice, + 'sampling-scope': [range(1, 6)]}, + 'hidden_size':{'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(10, 101, 10))]}, + 'cell_type':{'hyperopt-dist': hp.choice, + 'sampling-scope': [['GRU', 'LSTM', 'RNN']]}, + 'expected_distribution': {'hyperopt-dist': hp.choice, + 'sampling-scope': [['normal', 'cauchy']]} + }, 'patch_tst_model': {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(10, 100, 10)]]}, 'batch_size': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(8, 64, 6)]]}, diff --git a/tests/unit/core/models/test_teaser.py b/tests/unit/core/models/test_teaser.py new file mode 100644 index 000000000..2bc19b8de --- /dev/null +++ b/tests/unit/core/models/test_teaser.py @@ -0,0 +1,35 @@ +import pytest +import numpy as np +from fedot_ind.core.models.early_tc import teaser as TEASER + + +@pytest.fixture(scope='module') +def teaser(): + teaser = TEASER.TEASER({'interval_length': 10, 'prediction_mode': ''}) + return teaser + +@pytest.fixture(scope='module') +def xy(): + return np.random.randn((2, 23)), np.random.randint(0, 2, size=(2, 1)) + +def test_get_applicable_index(teaser): + teaser._init_model(23) + idx, offset = teaser._get_last_applicable_idx(100) + assert offset == 100 - 22, 'Wrong offset estimation when right edge' + assert idx == len(teaser.prediction_idx) - 1 + idx, offset = teaser._get_last_applicable_idx(12) + assert offset == 100 - teaser.prediction_idx[idx], 'Wrong offset estimation in the middle' + assert idx == len(teaser.prediction_idx) - 1 + +def test_compute_prediction_points(teaser): + indices = teaser._compute_prediction_points(23) + assert 2 in indices + assert 22 in indices + assert 23 not in indices + +# def test_consecutive_count(teaser): +# pass + +# def test_score(teaser): + + From 4204d6a259192c5f67a4fbde023cb651f7858d34 Mon Sep 17 00:00:00 2001 
From: leostre Date: Thu, 27 Jun 2024 18:22:34 +0300 Subject: [PATCH 05/43] class tree reconf. added proba_thresholding classifier (not registered) --- .../core/models/early_tc/base_early_tc.py | 115 +++++++++++++++++ .../core/models/early_tc/prob_threshold.py | 48 +++++++ fedot_ind/core/models/early_tc/teaser.py | 119 +++++------------- 3 files changed, 193 insertions(+), 89 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/base_early_tc.py create mode 100644 fedot_ind/core/models/early_tc/prob_threshold.py diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py new file mode 100644 index 000000000..094d895c3 --- /dev/null +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -0,0 +1,115 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum + + +class BaseETC(ClassifierMixin, BaseEstimator): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') + self.interval_percentage = params.get('interval_percentage', 10) # rewrite as interval_length + self.acceptance_threshold = 
params.get('acceptance_threshold', 5) + self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) + assert self.acceptance_threshold < self.interval_percentage, 'Not enough checkpoints for prediction proof' + + def _init_model(self, X, y): + max_data_length = X.shape[-1] + self.prediction_idx = self._compute_prediction_points(max_data_length) + self.n_pred = len(self.prediction_idx) + self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] + self.scalers = [StandardScaler() for _ in range(self.n_pred)] + self._best_estimator_idx = -1 + self.classes_ = [[-1, *np.unique(y)]] + + @property + def required_length(self): + if not hasattr(self, '_best_estimator_idx'): + return None + return self.prediction_idx[self._best_estimator_idx] + + def fit(self, X, y=None): + assert y is not None, 'Pass y' + y = np.array(y).flatten() + self._init_model(X, y) + for i in range(self.n_pred): + self._fit_one_interval(X, y, i) + self._best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
+ X_part = self.scalers[i].fit_transform(X_part) + probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + return probas + + def _predict_one_slave(self, X, i, offset=0): + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] + X_part = self.scalers[i].transform(X_part) + probas = self.slave_estimators[i].predict_proba(X_part) + return probas, np.argmax(probas, axis=-1) + + def _compute_prediction_points(self, n_idx): + interval_length = int(n_idx * self.interval_percentage / 100) + prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1] + self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + return prediction_idx + + def _select_estimators(self, X): + offset = 0 + if self.prediction_mode == 'best_by_harmonic_mean': + estimator_indices = [self._best_estimator_idx] + elif self.prediction_mode == 'all': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = np.arange(last_idx + 1) + else: + raise ValueError('Unknown prediction mode') + return estimator_indices, offset + + def _predict(self, X,): + estimator_indices, offset = self._select_estimators(X) + predicted_probas, predicted_labels = zip( + *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary + ) + return predicted_labels, predicted_probas + + def _consecutive_count(self, predicted_labels: List[np.array]): + n = len(predicted_labels[0]) + prediction_points = len(predicted_labels) + consecutive_labels = np.ones((prediction_points, n)) + for i in range(1, prediction_points): + equal = predicted_labels[i - 1] == predicted_labels[i] + consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 + return consecutive_labels # prediction_points x n_instances + + def predict_proba(self, X): + raise NotImplementedError + + def predict(self, X): + raise NotImplementedError + + def _score(self, X, y, hm_shift_to_acc=None): + y = np.array(y).flatten() + hm_shift_to_acc = 
hm_shift_to_acc or self.hm_shift_to_acc + predictions, *_ = self._predict(X) + prediction_points = predictions.shape[0] + accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) + return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) + + def _get_applicable_index(self, last_available_idx): + idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') + if idx == 0: + raise RuntimeError('Too few points for prediction!') + idx -= 1 + offset = last_available_idx - self.prediction_idx[idx] + return idx, offset diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py new file mode 100644 index 000000000..6e9c487c1 --- /dev/null +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -0,0 +1,48 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC + +class ProbabilityThresholdClassifier(BaseETC): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + 
self.probability_threshold = params.get('probability_threshold', 0.85) + + def predict_proba(self, X): + _, predicted_probas, non_acceptance = self._predict(X) + predicted_probas[non_acceptance] = 0 + return predicted_probas.squeeze() + + def predict(self, X): + predicted_labels, _, non_acceptance = self._predict(X) + predicted_labels[non_acceptance] = -1 + # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] + return predicted_labels # prediction_points x n_instances + + def _predict(self, X): + predicted_labels, predicted_probas = super()._predict(X) + non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold + to_second_check = np.argwhere(non_acceptance) + predicted_probas = np.stack(predicted_probas) + predicted_labels = np.stack(predicted_labels) + # for each point of estimation + for i in range(predicted_labels.shape[0]): + # find not accepted points + ith_point_to_oc = to_second_check[to_second_check[:, 0] == i, 1] + # if they are not outliers + final_verdict = (predicted_probas[i, ith_point_to_oc] > self.acceptance_threshold).any() + # mark as accepted + non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False + return predicted_labels, predicted_probas, non_acceptance diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 66a031fd4..0f08a9063 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,51 +1,32 @@ from typing import Union, List, Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data from fedot.core.data.data import InputData, OutputData from sklearn.svm import OneClassSVM from sklearn.preprocessing import StandardScaler from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator from sktime.classification.dictionary_based 
import MUSE, WEASEL from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC -class TEASER(ModelImplementation): +class TEASER(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): - super().__init__() - if params is None: - params = {} - self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') - self.interval_length = params.get('interval_length', 10) # rewrite as interval_length - self.acceptance_threshold = params.get('acceptance_threshold', 5) - self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) - assert self.acceptance_threshold < self.interval_length, 'Not enough checkpoints for prediction proof' - - # how to pass into ? % what needed - self._oc_svm_params = [100, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1.5, 1] + super().__init__(params) + self._oc_svm_params = (100., 10., 5., 2.5, 1.5, 1., 0.5, 0.25, 0.1) self.weasel_params = {} self.random_state = None # is needed? - def _init_model(self, max_data_length): - self.prediction_idx = self._compute_prediction_points(max_data_length) - self.n_pred = len(self.prediction_idx) + def _init_model(self, X, y): + super()._init_model(X, y) self.oc_estimators = [None] * self.n_pred - self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] - self.scalers = [StandardScaler() for _ in range(self.n_pred)] - self.__offset = max_data_length % self.interval_length - self.best_estimator_idx = -1 - - def fit(self, input_data: InputData): - input_data = self.__convert_pd(input_data) - X, y = input_data.features, input_data.target # what's passed in case of classification to training? 
- self._init_model(max_data_length=X.shape[-1]) - for i in range(self.n_pred): - self._fit_one_interval(X, y, i) - self.best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? - X_part = self.scalers[i].fit_transform(X_part) - probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + probas = super()._fit_one_interval(X, y, i) filtered_probas = self._filter_trues(probas, y) # X_oc = self._form_X_oc(filtered_probas) self.oc_estimators[i] = GridSearchCV(OneClassSVM(), @@ -55,17 +36,9 @@ def _fit_one_interval(self, X, y, i): ).fit(X_oc, np.ones((len(X_oc), 1))).best_estimator_ def _predict_one_slave(self, X, i, offset=0): - X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] - X_part = self.scalers[i].transform(X_part) - probas = self.slave_estimators[i].predict_proba(X_part) + probas, labels = super()._predict_one_slave(X, i, offset) X_oc = self._form_X_oc(probas) - return X_oc, np.argmax(probas, axis=-1) - - def _compute_prediction_points(self, n_idx): - """Computes indices for prediction, includes last index, first interval may be greater""" - prediction_idx = np.arange(n_idx - 1, -1, -self.interval_length)[::-1] - self.earliness = 1 - prediction_idx / n_idx - return prediction_idx + return X_oc, probas, labels def _filter_trues(self, predicted_probas, y): # different logic in sktime predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() @@ -78,67 +51,35 @@ def _form_X_oc(self, predicted_probas): return np.hstack([predicted_probas, d]) def _predict(self, X): - n = X.shape[0] - self.states = np.ones((n, self.n_pred, 2)) # num_consec, class - if self.prediction_mode == 'best_by_harmonic_mean': - estimator_indices = [self.best_estimator_idx] - else: - last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) - estimator_indices = list(range(last_idx + 1)) - X_ocs, 
predicted_labels = zip( + estimator_indices, offset = self._select_estimators(X) + X_ocs, predicted_probas, predicted_labels = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold to_oc_check = np.argwhere(non_acceptance) X_ocs = np.stack(X_ocs) + predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) + final_verdicts = np.zeros((len(estimator_indices), X.shape[0])) # for each point of estimation for i in range(predicted_labels.shape[0]): # find not accepted points ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] X_to_ith = X_ocs[i][ith_point_to_oc] # if they are not outliers - final_verdict = self.oc_estimators[i].predict(X_to_ith) # 1 for accept -1 for reject + final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # 1 for accept -1 for reject # mark as accepted - non_acceptance[i, np.argwhere(final_verdict == 1).flatten()] = False + non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False + final_verdicts[i] = final_verdict + return predicted_labels, predicted_probas, non_acceptance, final_verdicts + + def predict_proba(self, X): + _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) + predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] + return predicted_probas.squeeze() + + def predict(self, X): + predicted_labels, _, non_acceptance, final_verdicts = self._predict(X) predicted_labels[non_acceptance] = -1 + # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances - - def _consecutive_count(self, predicted_labels: List[np.array]): - n = len(predicted_labels[0]) - prediction_points = len(predicted_labels) - consecutive_labels = np.ones((prediction_points, n)) - for i in range(1, prediction_points): - equal = predicted_labels[i - 1] == 
predicted_labels[i] - consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 - return consecutive_labels # prediction_points x n_instances - - def __convert_pd(self, input_data): - if hasattr(input_data.features, 'values'): - input_data.features = input_data.features.values - if hasattr(input_data.target, 'values'): - input_data.target = input_data.target.values - return input_data - - def predict(self, input_data: InputData) -> OutputData: - input_data = self.__convert_pd(input_data) - prediction = self._predict(input_data.features) - return self._convert_to_output(input_data, predict=prediction) - - def predict_for_fit(self, input_data: InputData) -> OutputData: - return self.predict(input_data) - - def _score(self, X, y, hm_shift_to_acc=None): - hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc - predictions = self._predict(X) - prediction_points = predictions.shape[0] - accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) - return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) - - def _get_applicable_index(self, last_available_idx): - idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') - if idx == 0: - raise RuntimeError('Too few points for prediction!') - idx -= 1 - offset = last_available_idx - self.prediction_idx[idx] - return idx, offset From 5ac6f70fb514db63a4a146520852c80e5c1b25e8 Mon Sep 17 00:00:00 2001 From: leostre Date: Thu, 27 Jun 2024 18:22:34 +0300 Subject: [PATCH 06/43] class tree reconf. 
added proba_thresholding classifier (not registered) --- .../core/models/early_tc/base_early_tc.py | 117 +++++++++++++++++ .../core/models/early_tc/prob_threshold.py | 46 +++++++ fedot_ind/core/models/early_tc/teaser.py | 123 +++++------------- 3 files changed, 194 insertions(+), 92 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/base_early_tc.py create mode 100644 fedot_ind/core/models/early_tc/prob_threshold.py diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py new file mode 100644 index 000000000..f97ba0593 --- /dev/null +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -0,0 +1,117 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum + + +class BaseETC(ClassifierMixin, BaseEstimator): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') + self.interval_percentage = params.get('interval_percentage', 10) + self.consecutive_predictions = params.get('consecutive_predictions', 3) + self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) 
+ self.random_state = params.get('random_state', None) + self.weasel_params = {} + assert self.consecutive_predictions < self.interval_percentage, 'Not enough checkpoints for prediction proof' + + def _init_model(self, X, y): + max_data_length = X.shape[-1] + self.prediction_idx = self._compute_prediction_points(max_data_length) + self.n_pred = len(self.prediction_idx) + self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] + self.scalers = [StandardScaler() for _ in range(self.n_pred)] + self._best_estimator_idx = -1 + self.classes_ = [np.unique(y)] + + @property + def required_length(self): + if not hasattr(self, '_best_estimator_idx'): + return None + return self.prediction_idx[self._best_estimator_idx] + + def fit(self, X, y=None): + assert y is not None, 'Pass y' + y = np.array(y).flatten() + self._init_model(X, y) + for i in range(self.n_pred): + self._fit_one_interval(X, y, i) + self._best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
+ X_part = self.scalers[i].fit_transform(X_part) + probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + return probas + + def _predict_one_slave(self, X, i, offset=0): + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] + X_part = self.scalers[i].transform(X_part) + probas = self.slave_estimators[i].predict_proba(X_part) + return probas, np.argmax(probas, axis=-1) + + def _compute_prediction_points(self, n_idx): + interval_length = int(n_idx * self.interval_percentage / 100) + prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1] + self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + return prediction_idx + + def _select_estimators(self, X): + offset = 0 + if self.prediction_mode == 'best_by_harmonic_mean': + estimator_indices = [self._best_estimator_idx] + elif self.prediction_mode == 'all': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = np.arange(last_idx + 1) + else: + raise ValueError('Unknown prediction mode') + return estimator_indices, offset + + def _predict(self, X,): + estimator_indices, offset = self._select_estimators(X) + predicted_probas, predicted_labels = zip( + *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary + ) + return predicted_labels, predicted_probas + + def _consecutive_count(self, predicted_labels: List[np.array]): + n = len(predicted_labels[0]) + prediction_points = len(predicted_labels) + consecutive_labels = np.ones((prediction_points, n)) + for i in range(1, prediction_points): + equal = predicted_labels[i - 1] == predicted_labels[i] + consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 + return consecutive_labels # prediction_points x n_instances + + def predict_proba(self, X): + raise NotImplementedError + + def predict(self, X): + raise NotImplementedError + + def _score(self, X, y, hm_shift_to_acc=None): + y = np.array(y).flatten() + hm_shift_to_acc = 
hm_shift_to_acc or self.hm_shift_to_acc + predictions, *_ = self._predict(X) + prediction_points = predictions.shape[0] + accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) + return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) + + def _get_applicable_index(self, last_available_idx): + idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') + if idx == 0: + raise RuntimeError('Too few points for prediction!') + idx -= 1 + offset = last_available_idx - self.prediction_idx[idx] + return idx, offset diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py new file mode 100644 index 000000000..0433de34a --- /dev/null +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -0,0 +1,46 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC + +class ProbabilityThresholdClassifier(BaseETC): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + 
self.probability_threshold = params.get('probability_threshold', None) + + def _init_model(self, X, y): + super()._init_model(X, y) + if self.probability_threshold is None: + self.probability_threshold = 1 / len(self.classes_[0]) + + def predict_proba(self, X): + _, predicted_probas, non_acceptance = self._predict(X) + predicted_probas[non_acceptance] = 0 + return predicted_probas.squeeze() + + def predict(self, X): + predicted_labels, _, non_acceptance = self._predict(X) + predicted_labels[non_acceptance] = -1 + # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] + return predicted_labels # prediction_points x n_instances + + def _predict(self, X): + predicted_labels, predicted_probas = super()._predict(X) + predicted_probas = np.stack(predicted_probas) + predicted_labels = np.stack(predicted_labels) + non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions + double_check = predicted_probas.max(axis=-1) > self.probability_threshold + non_acceptance[non_acceptance & double_check] = False + return predicted_labels, predicted_probas, non_acceptance diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 66a031fd4..2809824c8 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,51 +1,30 @@ from typing import Union, List, Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data from fedot.core.data.data import InputData, OutputData from sklearn.svm import OneClassSVM from sklearn.preprocessing import StandardScaler from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator from sktime.classification.dictionary_based import MUSE, WEASEL from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from 
fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC -class TEASER(ModelImplementation): +class TEASER(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): - super().__init__() - if params is None: - params = {} - self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') - self.interval_length = params.get('interval_length', 10) # rewrite as interval_length - self.acceptance_threshold = params.get('acceptance_threshold', 5) - self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) - assert self.acceptance_threshold < self.interval_length, 'Not enough checkpoints for prediction proof' + super().__init__(params) + self._oc_svm_params = (100., 10., 5., 2.5, 1.5, 1., 0.5, 0.25, 0.1) - # how to pass into ? % what needed - self._oc_svm_params = [100, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1.5, 1] - self.weasel_params = {} - self.random_state = None # is needed? - - def _init_model(self, max_data_length): - self.prediction_idx = self._compute_prediction_points(max_data_length) - self.n_pred = len(self.prediction_idx) + def _init_model(self, X, y): + super()._init_model(X, y) self.oc_estimators = [None] * self.n_pred - self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] - self.scalers = [StandardScaler() for _ in range(self.n_pred)] - self.__offset = max_data_length % self.interval_length - self.best_estimator_idx = -1 - - def fit(self, input_data: InputData): - input_data = self.__convert_pd(input_data) - X, y = input_data.features, input_data.target # what's passed in case of classification to training? 
- self._init_model(max_data_length=X.shape[-1]) - for i in range(self.n_pred): - self._fit_one_interval(X, y, i) - self.best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? - X_part = self.scalers[i].fit_transform(X_part) - probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + probas = super()._fit_one_interval(X, y, i) filtered_probas = self._filter_trues(probas, y) # X_oc = self._form_X_oc(filtered_probas) self.oc_estimators[i] = GridSearchCV(OneClassSVM(), @@ -55,17 +34,9 @@ def _fit_one_interval(self, X, y, i): ).fit(X_oc, np.ones((len(X_oc), 1))).best_estimator_ def _predict_one_slave(self, X, i, offset=0): - X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] - X_part = self.scalers[i].transform(X_part) - probas = self.slave_estimators[i].predict_proba(X_part) + probas, labels = super()._predict_one_slave(X, i, offset) X_oc = self._form_X_oc(probas) - return X_oc, np.argmax(probas, axis=-1) - - def _compute_prediction_points(self, n_idx): - """Computes indices for prediction, includes last index, first interval may be greater""" - prediction_idx = np.arange(n_idx - 1, -1, -self.interval_length)[::-1] - self.earliness = 1 - prediction_idx / n_idx - return prediction_idx + return X_oc, probas, labels def _filter_trues(self, predicted_probas, y): # different logic in sktime predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() @@ -78,67 +49,35 @@ def _form_X_oc(self, predicted_probas): return np.hstack([predicted_probas, d]) def _predict(self, X): - n = X.shape[0] - self.states = np.ones((n, self.n_pred, 2)) # num_consec, class - if self.prediction_mode == 'best_by_harmonic_mean': - estimator_indices = [self.best_estimator_idx] - else: - last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) - estimator_indices = list(range(last_idx + 1)) - X_ocs, 
predicted_labels = zip( + estimator_indices, offset = self._select_estimators(X) + X_ocs, predicted_probas, predicted_labels = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) - non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold + non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions to_oc_check = np.argwhere(non_acceptance) X_ocs = np.stack(X_ocs) + predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) + final_verdicts = np.zeros((len(estimator_indices), X.shape[0])) # for each point of estimation for i in range(predicted_labels.shape[0]): # find not accepted points ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] X_to_ith = X_ocs[i][ith_point_to_oc] # if they are not outliers - final_verdict = self.oc_estimators[i].predict(X_to_ith) # 1 for accept -1 for reject + final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # 1 for accept -1 for reject # mark as accepted - non_acceptance[i, np.argwhere(final_verdict == 1).flatten()] = False + non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False + final_verdicts[i] = final_verdict + return predicted_labels, predicted_probas, non_acceptance, final_verdicts + + def predict_proba(self, X): + _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) + predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] + return predicted_probas.squeeze() + + def predict(self, X): + predicted_labels, _, non_acceptance, final_verdicts = self._predict(X) predicted_labels[non_acceptance] = -1 + # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances - - def _consecutive_count(self, predicted_labels: List[np.array]): - n = len(predicted_labels[0]) - prediction_points = len(predicted_labels) - consecutive_labels = np.ones((prediction_points, 
n)) - for i in range(1, prediction_points): - equal = predicted_labels[i - 1] == predicted_labels[i] - consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 - return consecutive_labels # prediction_points x n_instances - - def __convert_pd(self, input_data): - if hasattr(input_data.features, 'values'): - input_data.features = input_data.features.values - if hasattr(input_data.target, 'values'): - input_data.target = input_data.target.values - return input_data - - def predict(self, input_data: InputData) -> OutputData: - input_data = self.__convert_pd(input_data) - prediction = self._predict(input_data.features) - return self._convert_to_output(input_data, predict=prediction) - - def predict_for_fit(self, input_data: InputData) -> OutputData: - return self.predict(input_data) - - def _score(self, X, y, hm_shift_to_acc=None): - hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc - predictions = self._predict(X) - prediction_points = predictions.shape[0] - accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) - return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) - - def _get_applicable_index(self, last_available_idx): - idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') - if idx == 0: - raise RuntimeError('Too few points for prediction!') - idx -= 1 - offset = last_available_idx - self.prediction_idx[idx] - return idx, offset From 48e83289bc8bfe0b22bbca86e9be286311522e93 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 28 Jun 2024 14:11:17 +0300 Subject: [PATCH 07/43] both etc models are registered, available via api --- fedot_ind/core/models/early_tc/base_early_tc.py | 11 ++--------- .../core/models/early_tc/prob_threshold.py | 12 +----------- fedot_ind/core/models/early_tc/teaser.py | 10 +--------- .../data/default_operation_params.json | 9 +++++++-- .../data/industrial_model_repository.json 
| 17 +++++++++++++---- fedot_ind/core/repository/model_repository.py | 4 +++- fedot_ind/core/tuning/search_space.py | 12 ++++++++++-- 7 files changed, 37 insertions(+), 38 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index f97ba0593..c7b84bedf 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -1,16 +1,9 @@ -from typing import Union, List, Optional +from typing import Optional, List from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data -from fedot.core.data.data import InputData, OutputData -from sklearn.svm import OneClassSVM from sklearn.preprocessing import StandardScaler -from sklearn.model_selection import GridSearchCV from sklearn.base import ClassifierMixin, BaseEstimator -from sktime.classification.dictionary_based import MUSE, WEASEL -from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from sktime.classification.dictionary_based import WEASEL from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot.core.repository.tasks import Task, TaskTypesEnum class BaseETC(ClassifierMixin, BaseEstimator): diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 0433de34a..343077cbe 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -1,16 +1,6 @@ -from typing import Union, List, Optional +from typing import Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data -from fedot.core.data.data import InputData, 
OutputData -from sklearn.svm import OneClassSVM -from sklearn.preprocessing import StandardScaler -from sklearn.model_selection import GridSearchCV -from sklearn.base import ClassifierMixin, BaseEstimator -from sktime.classification.dictionary_based import MUSE, WEASEL -from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot.core.repository.tasks import Task, TaskTypesEnum from fedot_ind.core.models.early_tc.base_early_tc import BaseETC class ProbabilityThresholdClassifier(BaseETC): diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 2809824c8..f5d2590b3 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,16 +1,8 @@ -from typing import Union, List, Optional +from typing import Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data -from fedot.core.data.data import InputData, OutputData from sklearn.svm import OneClassSVM -from sklearn.preprocessing import StandardScaler from sklearn.model_selection import GridSearchCV -from sklearn.base import ClassifierMixin, BaseEstimator -from sktime.classification.dictionary_based import MUSE, WEASEL -from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot.core.repository.tasks import Task, TaskTypesEnum from fedot_ind.core.models.early_tc.base_early_tc import BaseETC diff --git a/fedot_ind/core/repository/data/default_operation_params.json 
b/fedot_ind/core/repository/data/default_operation_params.json index 1bbcc8614..52536d5cb 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -131,8 +131,13 @@ "bootstrap": false }, "teaser": { - "interval_length": 10, - "acceptance_threshold": 3, + "interval_percentage": 10, + "consecutive_predictions": 3, + "hm_shift_to_acc": 2 + }, + "proba_threshold_etc": { + "interval_percentage": 10, + "consecutive_predictions": 3, "hm_shift_to_acc": 2 }, "dt": { diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 8fb12f6de..309d5c56c 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -511,7 +511,7 @@ }, "ridge": { "meta": "sklearn_regr", - "presets": ["fast_train", "ts"], + "presets": ["fast_train"], "tags": [ "simple", "linear", @@ -618,15 +618,24 @@ ] }, "teaser": { - "meta": "ts_model", - "presets": ["fast_train", "ts"], + "meta": "sklearn_class", "tags": [ "simple", "interpretable", "non_lagged", "non_linear" ], - "input_type": "[DataTypesEnum.ts]" + "input_type": "[DataTypesEnum.table]" + }, + "proba_threshold_etc": { + "meta": "sklearn_class", + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" }, "xgboost": { "meta": "sklearn_class", diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index a984cbd38..908622195 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -45,6 +45,7 @@ from xgboost import XGBRegressor from fedot_ind.core.models.early_tc.teaser import TEASER +from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier from fedot_ind.core.models.manifold.riemann_embeding 
import RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR @@ -135,7 +136,8 @@ class AtomizedModel(Enum): # external models 'lgbm': LGBMClassifier, # Early classification - 'teaser': TEASER + 'teaser': TEASER, + 'proba_threshold_etc': ProbabilityThresholdClassifier } FEDOT_PREPROC_MODEL = { # data standartization diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 37849840d..11be89db9 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -68,15 +68,23 @@ 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, }, + 'proba_threshold_etc': + {'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'acceptance_threshold': {'hyperopt-dist': hp.choice, + 'sampling_scope': [[1, 2, 3, 4, 5]]}, + 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, + 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + }, 'deepar_model': {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(10, 100, 10)]]}, 'batch_size': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(8, 64, 6)]]}, 'dropout': {'hyperopt-dist': hp.choice, - 'sampling-scope': [list(range(0, 0.6, 0.1))]}, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5]]}, 'rnn_layers':{'hyperopt-dist': hp.choice, - 'sampling-scope': [range(1, 6)]}, + 'sampling-scope': [list(range(1, 6))]}, 'hidden_size':{'hyperopt-dist': hp.choice, 'sampling-scope': [list(range(10, 101, 10))]}, 'cell_type':{'hyperopt-dist': hp.choice, From 18a895ae8440910ee008b3fb498d89bf842c19b4 Mon Sep 17 00:00:00 2001 From: leostre Date: Tue, 2 Jul 2024 15:27:34 +0300 Subject: [PATCH 08/43] ecec added --- .../core/models/early_tc/base_early_tc.py | 22 ++++--- fedot_ind/core/models/early_tc/ecec.py | 62 +++++++++++++++++++ 
.../core/models/early_tc/prob_threshold.py | 19 ++++-- fedot_ind/core/models/early_tc/teaser.py | 9 +++ 4 files changed, 99 insertions(+), 13 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/ecec.py diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index c7b84bedf..5da8e61bd 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -33,6 +33,10 @@ def required_length(self): if not hasattr(self, '_best_estimator_idx'): return None return self.prediction_idx[self._best_estimator_idx] + + @property + def n_classes(self): + return len(self.classes_[0]) def fit(self, X, y=None): assert y is not None, 'Pass y' @@ -40,7 +44,6 @@ def fit(self, X, y=None): self._init_model(X, y) for i in range(self.n_pred): self._fit_one_interval(X, y, i) - self._best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) def _fit_one_interval(self, X, y, i): X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
@@ -60,23 +63,23 @@ def _compute_prediction_points(self, n_idx): self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 return prediction_idx - def _select_estimators(self, X): + def _select_estimators(self, X, training=False): offset = 0 - if self.prediction_mode == 'best_by_harmonic_mean': + if not training and self.prediction_mode == 'best_by_harmonic_mean': estimator_indices = [self._best_estimator_idx] - elif self.prediction_mode == 'all': + elif training or self.prediction_mode == 'all': last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) estimator_indices = np.arange(last_idx + 1) else: raise ValueError('Unknown prediction mode') return estimator_indices, offset - def _predict(self, X,): - estimator_indices, offset = self._select_estimators(X) - predicted_probas, predicted_labels = zip( + def _predict(self, X, training=True): + estimator_indices, offset = self._select_estimators(X, training) + prediction = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) - return predicted_labels, predicted_probas + return prediction # see the output in _predict_one_slave def _consecutive_count(self, predicted_labels: List[np.array]): n = len(predicted_labels[0]) @@ -96,11 +99,12 @@ def predict(self, X): def _score(self, X, y, hm_shift_to_acc=None): y = np.array(y).flatten() hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc - predictions, *_ = self._predict(X) + predictions = self._predict(X)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) + def _get_applicable_index(self, last_available_idx): idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') if idx == 0: diff --git a/fedot_ind/core/models/early_tc/ecec.py 
b/fedot_ind/core/models/early_tc/ecec.py new file mode 100644 index 000000000..a00df631d --- /dev/null +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -0,0 +1,62 @@ +from typing import Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from sklearn.model_selection import cross_val_predict +from sklearn.base import clone +from sklearn.metrics import confusion_matrix + +class ECEC(BaseETC): + def __init__(self, params: Optional[OperationParameters] = None): + super().__init__(params) + + def _init_model(self, X, y): + super()._init_model(X, y) + self._confidences = np.ones((X.shape[0], self.n_pred)) + + def _score(self, X, y, alpha): + y = y.astype(int) + predicted_labels = np.stack(super()._predict(X)[0]).astype(int) # n_pred x n_inst + n = predicted_labels.shape[0] + accuracies = (predicted_labels == np.tile(y, (1, n))) # n_pred x n_inst + confidences = np.ones((n, X.shape[0]), dtype='float32') + for i in range(n): + y_pred = predicted_labels[i] + reliability_i = confusion_matrix(y, y_pred, normalize='pred') + confidences[i] = 1 - reliability_i[y, y_pred] # n_inst + confidences = 1 - np.cumprod(confidences, axis=0) # n_pred x n_inst + candidates = self._select_thrs(confidences) # n_candidates + cfs = np.zeros_like(candidates) + for i, candidate in enumerate(candidates): + mask = confidences >= candidate # n_pred x n_inst + accuracy_for_candidate = (accuracies * mask).sum(1) / mask.sum(1) # n_pred + cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) + return candidates[np.argmin(cfs)] + + @staticmethod + def _select_thrs(confidences): + C = np.unique(confidences.round(3)) + difference = np.diff(C) + pair_means = C[:-1] + difference / 2 + difference_shifted = np.roll(difference, 1) + difference_idx = np.argwhere(difference > difference_shifted) + return 
pair_means[difference_idx].flatten() + + @staticmethod + def cost_func(earliness, accuracies, alpha): + return alpha * accuracies + (1 - alpha) * earliness + + def fit(self, X, y): + self.confidence_threshold = super().fit(X, y) + + + + + + + + + + + + diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 47fb76142..bfcccace5 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -21,16 +21,27 @@ def predict_proba(self, X): return predicted_probas.squeeze() def predict(self, X): - predicted_labels, _, non_acceptance = self._predict(X) + predicted_labels, _, non_acceptance = self._predict(X, training=False) predicted_labels[non_acceptance] = -1 # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances - def _predict(self, X): - predicted_labels, predicted_probas = super()._predict(X) + def _predict(self, X, training=True): + predicted_probas, predicted_labels = super()._predict(X, training) predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) + # print(predicted_labels.shape, predicted_probas.shape) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions double_check = predicted_probas.max(axis=-1) > self.probability_threshold non_acceptance[non_acceptance & double_check] = False - return predicted_labels, predicted_probas, non_acceptance \ No newline at end of file + return predicted_labels, predicted_probas, non_acceptance + + def _score(self, X, y, hm_shift_to_acc=None): + scores = super()._score(X, y, hm_shift_to_acc) + self._best_estimator_idx = np.argmax(scores) + return scores + + def fit(self, X, y): + super().fit(X, y) + return self._score(X, y, self.hm_shift_to_acc) + diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 713104099..5ed6accbe 
100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -75,3 +75,12 @@ def predict(self, X): predicted_labels[non_acceptance] = -1 # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances + + def _score(self, X, y, hm_shift_to_acc=None): + scores = super()._score(X, y, hm_shift_to_acc) + self._best_estimator_idx = np.argmax(scores) + return scores + + def fit(self, X, y): + super().fit(X, y) + return self._score(X, y, self.hm_shift_to_acc) From 0c10a07f8ec84bad39728589a07e751e814ffb47 Mon Sep 17 00:00:00 2001 From: leostre Date: Thu, 4 Jul 2024 18:23:13 +0300 Subject: [PATCH 09/43] economy_k added --- .../core/models/early_tc/base_early_tc.py | 9 +- fedot_ind/core/models/early_tc/economy_k.py | 89 +++++++++++++++++++ .../core/models/early_tc/prob_threshold.py | 6 +- fedot_ind/core/models/early_tc/teaser.py | 6 +- 4 files changed, 100 insertions(+), 10 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/economy_k.py diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 5da8e61bd..5e180c2a9 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -14,7 +14,8 @@ def __init__(self, params: Optional[OperationParameters] = None): self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') self.interval_percentage = params.get('interval_percentage', 10) self.consecutive_predictions = params.get('consecutive_predictions', 3) - self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) + self.accuracy_importance = params.get('accuracy_importance', 1.) 
+ self.min_ts_length = params.get('min_ts_step', 3) self.random_state = params.get('random_state', None) self.weasel_params = {} assert self.consecutive_predictions < self.interval_percentage, 'Not enough checkpoints for prediction proof' @@ -58,8 +59,8 @@ def _predict_one_slave(self, X, i, offset=0): return probas, np.argmax(probas, axis=-1) def _compute_prediction_points(self, n_idx): - interval_length = int(n_idx * self.interval_percentage / 100) - prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1] + interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) + prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1][1:] self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 return prediction_idx @@ -98,7 +99,7 @@ def predict(self, X): def _score(self, X, y, hm_shift_to_acc=None): y = np.array(y).flatten() - hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc + hm_shift_to_acc = hm_shift_to_acc or self.accuracy_importance predictions = self._predict(X)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py new file mode 100644 index 000000000..639e680cd --- /dev/null +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -0,0 +1,89 @@ +from typing import Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from sklearn.cluster import KMeans +from sklearn.metrics import confusion_matrix +from sklearn.model_selection import train_test_split, cross_val_predict + +class EconomyK(BaseETC): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__(params) 
+ self.lambda_ = params.get('lambda', 1.) + self._cluster_factor = params.get('cluster_factor' , 1) + self._random_state = 2104 + self.__cv = 5 + + def _init_model(self, X, y): + super()._init_model(X, y) + self.n_clusters = int(self._cluster_factor * self.n_classes) + self._clusterizer = KMeans(self.n_clusters, random_state=self._random_state) + self.state = np.zeros((self.n_pred, self.n_clusters, self.n_classes, self.n_classes)) + + def fit(self, X, y): + y = y.flatten().astype(int) + self._init_model(X, y) + self._pyck_ = confusion_matrix(y, self._clusterizer.fit(X).labels_, normalize='true')[:self.n_classes, :self.n_clusters] + for i in range(self.n_pred): + self._fit_one_interval(X, y, i) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i] + 1] + X_part = self.scalers[i].fit_transform(X_part) + y_pred = cross_val_predict(self.slave_estimators[i], X_part, y, cv=self.__cv) + self.slave_estimators[i].fit(X_part, y) + states_by_i = np.zeros(( self.n_clusters, self.n_classes, self.n_classes)) + np.add.at(states_by_i, (self._clusterizer.labels_, y, y_pred), 1) + states_by_i /= np.mean(states_by_i, -2, keepdims=True) + states_by_i[np.isnan(states_by_i)] = 0 + states_by_i[:, np.eye(self.n_classes).astype(bool)] = 0 + self.state[i] = states_by_i + + def _predict_one_slave(self, X, i, offset=0): + cluster_centers = self._clusterizer.cluster_centers_[:, :self.prediction_idx[i] + 1] # n_clust x len + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] # n_inst x len + X_part = self.scalers[i].transform(X_part) + probas = self.slave_estimators[i].predict_proba(X_part) + optimal_time, is_optimal = self._get_prediction_time(X_part, cluster_centers, i) + return probas, optimal_time, is_optimal + + def __cluster_probas(self, X, centroids): + length = centroids.shape[-1] + diffs = np.subtract.outer(X, centroids).swapaxes(1, 2) + diffs = diffs[..., np.eye(length).astype(bool)] # n_inst x n_clust x len + distances = np.linalg.norm(diffs, 
axis=-1) + delta_k = 1. - distances / distances.mean(axis=-1)[:, None] + s = 1. / (1. + np.exp(-self.lambda_ * delta_k)) + return s / s.sum(axis=-1)[:, None] # n_inst x n_clust + + def __expected_costs(self, X, cluster_centroids, i): + cluster_probas = self.__cluster_probas(X, cluster_centroids) # n_inst x n_clust + s_glob = np.sum(np.transpose( + np.sum(self.state[i:], axis=-1), axes=(0, 2, 1) + ) * self._pyck_[None, ...], axis=1) + costs = cluster_probas @ s_glob.T # n_inst x time_left + costs += self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? + return costs + + def _get_prediction_time(self, X, cluster_centroids, i): + costs = self.__expected_costs(X, cluster_centroids, i) + min_costs = np.argmin(costs, axis=-1) + is_optimal = min_costs == 0 + time_optimal = self.prediction_idx[min_costs + i] + return time_optimal, is_optimal # n_inst + + def predict_proba(self, X): + probas, times, is_optimal = self._predict(X) + is_optimal = np.stack(is_optimal) + idx = np.tile(np.arange(self.n_pred), (is_optimal.shape[1], 1)).T # n_pred x n_inst + idx[~is_optimal] = self.n_pred + idx = np.argmin(idx, 0) + probas = np.stack(probas) + return probas[idx], np.stack(times)[idx] + + def predict(self, X): + probas, times = self.predict_proba(X) + labels = probas.argmax(-1) + return labels, times diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index bfcccace5..51d169909 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -36,12 +36,12 @@ def _predict(self, X, training=True): non_acceptance[non_acceptance & double_check] = False return predicted_labels, predicted_probas, non_acceptance - def _score(self, X, y, hm_shift_to_acc=None): - scores = super()._score(X, y, hm_shift_to_acc) + def _score(self, X, y, accuracy_importance=None): + scores = super()._score(X, y, accuracy_importance) self._best_estimator_idx = 
np.argmax(scores) return scores def fit(self, X, y): super().fit(X, y) - return self._score(X, y, self.hm_shift_to_acc) + return self._score(X, y, self.accuracy_importance) diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 5ed6accbe..593a34e72 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -76,11 +76,11 @@ def predict(self, X): # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances - def _score(self, X, y, hm_shift_to_acc=None): - scores = super()._score(X, y, hm_shift_to_acc) + def _score(self, X, y, accuracy_importance=None): + scores = super()._score(X, y, accuracy_importance) self._best_estimator_idx = np.argmax(scores) return scores def fit(self, X, y): super().fit(X, y) - return self._score(X, y, self.hm_shift_to_acc) + return self._score(X, y, self.accuracy_importance) From 251bca6d7837fc29d68cdfef586304b5cfc06b59 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 5 Jul 2024 12:30:52 +0300 Subject: [PATCH 10/43] mlstm init --- .../core/models/nn/network_impl/mlstm.py | 127 ++++++++++++++++++ 1 file changed, 127 insertions(+) create mode 100644 fedot_ind/core/models/nn/network_impl/mlstm.py diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py new file mode 100644 index 000000000..31ca6fbd4 --- /dev/null +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -0,0 +1,127 @@ +from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel +from typing import Optional, Callable, Any, List, Union +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.data.data import InputData, OutputData +from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE +import torch.optim as optim +import torch.nn as nn +import torch.nn.functional as F 
+import torch +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array +import pandas as pd +from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams +from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter +import torch.utils.data as data +from fedot_ind.core.architecture.settings.computational import default_device + +class SqueezeExciteBlock(nn.Module): + def __init__(self, input_channels, filters, reduce=4): + super().__init__() + self.filters = filters + self.pool = nn.AvgPool1d(input_channels) + self.bottleneck = max(self.filters // reduce, 4) + self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) + self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) + torch.nn.init.kaiming_normal_(self.fc1.weight.data) + torch.nn.init.kaiming_normal_(self.fc2.weight.data) + + def forward(self, x): + input_x = x + x = self.pool(x) + x = F.relu(self.fc1(x.view(-1, 1, self.filters))) + x = F.sigmoid(self.fc2(x)) + x = x.view(-1, self.filters, 1) * input_x + return x + +class MLSTM_module(nn.Module): + def __init__(self, input_size, input_channels, + inner_size, inner_channels, + output_size, num_layers, dropout=0.25): + super().__init__() + self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) + self.lstm = nn.LSTM(input_size, inner_size, num_layers, + batch_first=True, dropout=dropout) + self.conv_branch = nn.Sequential( + nn.Conv1d(input_channels, inner_channels, + padding='same', + kernel_size=9), + nn.BatchNorm1d(inner_channels), + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels), + nn.Conv1d(inner_channels, inner_channels * 2, + padding='same', + kernel_size=5, + ), # 
c x l | n x c x l + nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels * 2), + nn.Conv1d(inner_channels * 2, inner_channels, + padding='same', + kernel_size=3, + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels), # n x c | n x c x l + nn.ReLU(), + ) + seq = next(iter(self.conv_branch.modules())) + idx = [0, 4, 8] + for i in idx: + torch.nn.init.kaiming_uniform_(seq[i].weight.data) + + def forward(self, x): + x_lstm, _ = self.lstm(x) # n x input_ch x inner_size + x_conv = self.conv_branch(x) # n x inner_ch x len + print(x_conv.size(), x_lstm.size()) + x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) + x = F.softmax(self.proj(x)) + return x + + +class MLSTM(BaseNeuralModel): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + # self.num_classes = params.get('num_classes', None) + # self.epochs = params.get('epochs', 100) + # self.batch_size = params.get('batch_size', 16) + # self.activation = params.get('activation', 'ReLU') + # self.learning_rate = 0.001 + + self.dropout = params.get('dropout', 0.25) + self.hidden_size = params.get('hidden_size', 64) + self.hidden_channels = params.get('hidden_channels', 32) + self.num_layers = params.get('num_layers', 2) + # self.target = None + # self.task_type = None + + def _init_model(self, ts: InputData): + _, input_channels, input_size = ts.features.shape + self.model = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + self.model_for_inference = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + optimizer = optim.Adam(self.model.parameters(), lr=0.001) + if ts.num_classes == 2: + loss_fn = CROSS_ENTROPY() + else: + loss_fn = MULTI_CLASS_CROSS_ENTROPY() + return 
loss_fn, optimizer + + @convert_to_3d_torch_array + def _fit_model(self, ts: InputData): + loss_fn, optimizer = self._init_model(ts) + train_loader, val_loader = self._prepare_data(ts, split_data=True) + self._train_loop( + train_loader=train_loader, + val_loader=val_loader, + loss_fn=loss_fn, + optimizer=optimizer + ) + From ace6626cae8b40c6489db63c3fa5566805efa9a8 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 5 Jul 2024 12:30:52 +0300 Subject: [PATCH 11/43] mlstm registered --- .../architecture/abstraction/decorators.py | 4 +- fedot_ind/core/models/early_tc/ecec.py | 62 ++++--- .../core/models/nn/network_impl/mlstm.py | 154 ++++++++++++++++++ .../data/default_operation_params.json | 4 + .../data/industrial_model_repository.json | 6 + fedot_ind/core/repository/model_repository.py | 5 +- 6 files changed, 210 insertions(+), 25 deletions(-) diff --git a/fedot_ind/core/architecture/abstraction/decorators.py b/fedot_ind/core/architecture/abstraction/decorators.py index a9226ba0b..e34aa52a9 100644 --- a/fedot_ind/core/architecture/abstraction/decorators.py +++ b/fedot_ind/core/architecture/abstraction/decorators.py @@ -42,13 +42,13 @@ def decorated_func(self, *args): def convert_to_3d_torch_array(func): def decorated_func(self, *args): - init_data = args[0] + init_data, *args = args data = DataConverter(data=init_data).convert_to_torch_format() if isinstance(init_data, InputData): init_data.features = data else: init_data = data - return func(self, init_data, args[1]) + return func(self, init_data, *args) return decorated_func diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index a00df631d..45f7f9fe4 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -12,26 +12,53 @@ def __init__(self, params: Optional[OperationParameters] = None): def _init_model(self, X, y): super()._init_model(X, y) - self._confidences = np.ones((X.shape[0], self.n_pred)) + self._reliabilities = 
np.zeros((self.n_pred, self.n_classes, self.n_classes)) + + def _predict_one_slave(self, X, i, offset=0): + predicted_probas, predicted_labels = super()._predict_one_slave(X, i, offset) + reliabilities = self._reliabilities[i, predicted_labels, predicted_labels].flatten() # n_inst + return predicted_labels.astype(int), predicted_probas, reliabilities + + def _predict(self, X, training=False): + predicted_labels, predicted_probas, reliabilities = super()._predict(X, training) + reliabilities = np.stack(reliabilities) + confidences = 1 - np.cumprod(1 - reliabilities, axis=0) + non_confident = confidences < self.confidence_thresholds[:len(predicted_labels), None] + return predicted_labels, predicted_probas, non_confident, confidences - def _score(self, X, y, alpha): + def predict(self, X): + predicted_labels, _, non_confident, confidences = self._predict(X) + predicted_labels = np.stack(predicted_labels) + predicted_labels[non_confident] = -1 + return predicted_labels, confidences + + def predict_proba(self, X): + _, predicted_probas, non_confident, confidences = self._predict(X) + predicted_probas = np.stack(predicted_probas) + predicted_probas[non_confident] = -1 + return predicted_probas, confidences + + def _score(self, X, y, alpha, training=False): y = y.astype(int) - predicted_labels = np.stack(super()._predict(X)[0]).astype(int) # n_pred x n_inst + predicted_labels, *_ = super()._predict(X, training) # n_pred x n_inst + predicted_labels = np.stack(predicted_labels) n = predicted_labels.shape[0] - accuracies = (predicted_labels == np.tile(y, (1, n))) # n_pred x n_inst + accuracies = (predicted_labels == np.tile(y, (n, 1))) # n_pred x n_inst confidences = np.ones((n, X.shape[0]), dtype='float32') for i in range(n): y_pred = predicted_labels[i] reliability_i = confusion_matrix(y, y_pred, normalize='pred') confidences[i] = 1 - reliability_i[y, y_pred] # n_inst + self._reliabilities[i] = reliability_i confidences = 1 - np.cumprod(confidences, axis=0) # n_pred x 
n_inst candidates = self._select_thrs(confidences) # n_candidates - cfs = np.zeros_like(candidates) + cfs = np.zeros((len(candidates), n)) for i, candidate in enumerate(candidates): mask = confidences >= candidate # n_pred x n_inst accuracy_for_candidate = (accuracies * mask).sum(1) / mask.sum(1) # n_pred cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) - return candidates[np.argmin(cfs)] + self._best_estimator_idx = np.argmin(cfs.mean(0)) + return candidates[np.argmin(cfs, axis=0)] # n_pred @staticmethod def _select_thrs(confidences): @@ -39,24 +66,15 @@ def _select_thrs(confidences): difference = np.diff(C) pair_means = C[:-1] + difference / 2 difference_shifted = np.roll(difference, 1) - difference_idx = np.argwhere(difference > difference_shifted) - return pair_means[difference_idx].flatten() + difference_idx = np.argwhere(difference <= difference_shifted) + means_candidates = pair_means[difference_idx].flatten() + return means_candidates if len(means_candidates) else C @staticmethod def cost_func(earliness, accuracies, alpha): - return alpha * accuracies + (1 - alpha) * earliness + return alpha * (1 - accuracies) + (1 - alpha) * earliness def fit(self, X, y): - self.confidence_threshold = super().fit(X, y) - - - - - - - - - - - - + super().fit(X, y) + self.confidence_thresholds = self._score(X, y, self.accuracy_importance, training=True) + \ No newline at end of file diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 31ca6fbd4..9a0a52ba6 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -125,3 +125,157 @@ def _fit_model(self, ts: InputData): optimizer=optimizer ) + +from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel +from typing import Optional, Callable, Any, List, Union +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.data.data import 
InputData, OutputData +from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE +import torch.optim as optim +import torch.nn as nn +import torch.nn.functional as F +import torch +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array +import pandas as pd +from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams +from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter +import torch.utils.data as data +from fedot_ind.core.architecture.settings.computational import default_device + +class SqueezeExciteBlock(nn.Module): + def __init__(self, input_channels, filters, reduce=4): + super().__init__() + self.filters = filters + self.pool = nn.AvgPool1d(input_channels) + self.bottleneck = max(self.filters // reduce, 4) + self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) + self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) + torch.nn.init.kaiming_normal_(self.fc1.weight.data) + torch.nn.init.kaiming_normal_(self.fc2.weight.data) + + def forward(self, x): + input_x = x + x = self.pool(x) + x = F.relu(self.fc1(x.view(-1, 1, self.filters))) + x = F.sigmoid(self.fc2(x)) + x = x.view(-1, self.filters, 1) * input_x + return x + +class MLSTM_module(nn.Module): + def __init__(self, input_size, input_channels, + inner_size, inner_channels, + output_size, num_layers, dropout=0.25): + super().__init__() + self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) + self.lstm = nn.LSTM(input_size, inner_size, num_layers, + batch_first=True, dropout=dropout) + self.conv_branch = nn.Sequential( + nn.Conv1d(input_channels, inner_channels, + 
padding='same', + kernel_size=9), + nn.BatchNorm1d(inner_channels), + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels), + nn.Conv1d(inner_channels, inner_channels * 2, + padding='same', + kernel_size=5, + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels * 2), + nn.Conv1d(inner_channels * 2, inner_channels, + padding='same', + kernel_size=3, + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels), # n x c | n x c x l + nn.ReLU(), + ) + seq = next(iter(self.conv_branch.modules())) + idx = [0, 4, 8] + for i in idx: + torch.nn.init.kaiming_uniform_(seq[i].weight.data) + + def forward(self, x, hidden_state=None): + x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size + x_conv = self.conv_branch(x) # n x inner_ch x len + x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) + x = F.softmax(self.proj(x)) + return x#, hidden_state + + def augment_zero_padding(self, X: torch.Tensor): + res = [] + for i in self.prediction_idx: + zeroed_X = X[...] + zeroed_X[..., i + 1:] = 0 + res.append(zeroed_X) + res = torch.concat(res, 0) + return res[torch.randperm(res.size(0)), ...] 
+ +class MLSTM(BaseNeuralModel): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + # self.num_classes = params.get('num_classes', None) + # self.epochs = params.get('epochs', 100) + # self.batch_size = params.get('batch_size', 16) + # self.activation = params.get('activation', 'ReLU') + # self.learning_rate = 0.001 + + self.dropout = params.get('dropout', 0.25) + self.hidden_size = params.get('hidden_size', 64) + self.hidden_channels = params.get('hidden_channels', 32) + self.num_layers = params.get('num_layers', 2) + # self.target = None + # self.task_type = None + self.interval_percentage = params.get('interval_percentage', 10) + self.min_ts_length = params.get('min_ts_length', 5) + + def _compute_prediction_points(self, n_idx): + interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) + prediction_idx = np.arange(0, n_idx, interval_length) + self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + return prediction_idx + + def _init_model(self, ts: InputData): + _, input_channels, input_size = ts.features.shape + self.prediction_idx = self._compute_prediction_points(input_size) + self.model = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + self.model_for_inference = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + optimizer = optim.Adam(self.model.parameters(), lr=0.001) + if ts.num_classes == 2: + loss_fn = CROSS_ENTROPY() + else: + loss_fn = MULTI_CLASS_CROSS_ENTROPY() + return loss_fn, optimizer + + def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): + return super()._train_loop(train_loader, val_loader, loss_fn, optimizer) + + @convert_to_3d_torch_array + def _fit_model(self, ts: InputData): + if isinstance(ts, 
torch.Tensor): + ts = self.augment_zero_padding(ts) + else: + print(type(ts)) + loss_fn, optimizer = self._init_model(ts) + train_loader, val_loader = self._prepare_data(ts, split_data=True) + self._train_loop( + train_loader=train_loader, + val_loader=val_loader, + loss_fn=loss_fn, + optimizer=optimizer + ) + + + + diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index 52536d5cb..b875c3225 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -172,6 +172,10 @@ "learning_rate": "constant", "solver": "adam" }, + "mlstm_model": { + "epochs": 100, + "batch_size": 16 + }, "ar": { "lag_1": 7, "lag_2": 12, diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 309d5c56c..0823954a2 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -282,6 +282,12 @@ "automl" ] }, + "mlstm_model": { + "meta": "fedot_NN_classification", + "presets": ["ts"], + "tags": [], + "input_type": "[DataTypesEnum.table]" + }, "xcm_model": { "meta": "fedot_NN_classification", "presets": [ diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index 908622195..9777b81c1 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -53,6 +53,7 @@ from fedot_ind.core.models.nn.network_impl.inception import InceptionTimeModel from fedot_ind.core.models.nn.network_impl.lora_nn import LoraModel from fedot_ind.core.models.nn.network_impl.mini_rocket import MiniRocketExtractor +from fedot_ind.core.models.nn.network_impl.mlstm import MLSTM from fedot_ind.core.models.nn.network_impl.nbeats import NBeatsModel from 
fedot_ind.core.models.nn.network_impl.omni_scale import OmniScaleModel from fedot_ind.core.models.nn.network_impl.resnet import ResNetModel @@ -221,7 +222,9 @@ class AtomizedModel(Enum): # linear_dummy_model 'dummy': DummyOverComplicatedNeuralNetwork, # linear_dummy_model - 'lora_model': LoraModel + 'lora_model': LoraModel, + # early ts classification + 'mlstm_model': MLSTM } From 42ba3f00fee57838534e5f48536e4295ca4773ce Mon Sep 17 00:00:00 2001 From: leostre Date: Tue, 9 Jul 2024 14:33:24 +0300 Subject: [PATCH 12/43] fitting w augmentation --- .../architecture/abstraction/decorators.py | 9 +- .../models/nn/network_impl/base_nn_model.py | 6 +- .../core/models/nn/network_impl/mlstm.py | 201 ++++-------------- 3 files changed, 55 insertions(+), 161 deletions(-) diff --git a/fedot_ind/core/architecture/abstraction/decorators.py b/fedot_ind/core/architecture/abstraction/decorators.py index e34aa52a9..f21218cd1 100644 --- a/fedot_ind/core/architecture/abstraction/decorators.py +++ b/fedot_ind/core/architecture/abstraction/decorators.py @@ -11,9 +11,10 @@ def fedot_data_type(func): def decorated_func(self, *args): - if not isinstance(args[0], InputData): - args[0] = DataConverter(data=args[0]) - features = args[0].features + data, *rest_args = args + if not isinstance(data, InputData): + data = DataConverter(data=data) + features = data.features if len(features.shape) < 4: try: @@ -22,7 +23,7 @@ def decorated_func(self, *args): input_data_squeezed = np.squeeze(features) else: input_data_squeezed = features - return func(self, input_data_squeezed, args[1]) + return func(self, input_data_squeezed, *rest_args) return decorated_func diff --git a/fedot_ind/core/models/nn/network_impl/base_nn_model.py b/fedot_ind/core/models/nn/network_impl/base_nn_model.py index a29fc694b..ff688fed9 100644 --- a/fedot_ind/core/models/nn/network_impl/base_nn_model.py +++ b/fedot_ind/core/models/nn/network_impl/base_nn_model.py @@ -78,7 +78,7 @@ def _fit_model(self, ts: InputData): def 
_init_model(self, ts) -> tuple: NotImplementedError() - def _prepare_data(self, ts, split_data: bool = True): + def _prepare_data(self, ts, split_data: bool = True, collate_fn=None): if split_data: train_data, val_data = train_test_data_setup( @@ -90,13 +90,13 @@ def _prepare_data(self, ts, split_data: bool = True): val_dataset = None train_loader = torch.utils.data.DataLoader( - train_dataset, batch_size=self.batch_size, shuffle=True) + train_dataset, batch_size=self.batch_size, shuffle=True, collate_fn=collate_fn) if val_dataset is None: val_loader = val_dataset else: val_loader = torch.utils.data.DataLoader( - val_dataset, batch_size=self.batch_size, shuffle=True) + val_dataset, batch_size=self.batch_size, shuffle=True, collate_fn=collate_fn) self.label_encoder = train_dataset.label_encoder return train_loader, val_loader diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 9a0a52ba6..612d2b11b 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -4,11 +4,13 @@ from fedot.core.data.data import InputData, OutputData from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE import torch.optim as optim +from torch.optim import lr_scheduler import torch.nn as nn import torch.nn.functional as F import torch +from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array, fedot_data_type import pandas as pd from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping @@ -70,149 +72,19 @@ def __init__(self, input_size, input_channels, for i in idx: 
torch.nn.init.kaiming_uniform_(seq[i].weight.data) - def forward(self, x): - x_lstm, _ = self.lstm(x) # n x input_ch x inner_size - x_conv = self.conv_branch(x) # n x inner_ch x len - print(x_conv.size(), x_lstm.size()) - x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) - x = F.softmax(self.proj(x)) - return x - - -class MLSTM(BaseNeuralModel): - def __init__(self, params: Optional[OperationParameters] = None): - if params is None: - params = {} - super().__init__() - # self.num_classes = params.get('num_classes', None) - # self.epochs = params.get('epochs', 100) - # self.batch_size = params.get('batch_size', 16) - # self.activation = params.get('activation', 'ReLU') - # self.learning_rate = 0.001 - - self.dropout = params.get('dropout', 0.25) - self.hidden_size = params.get('hidden_size', 64) - self.hidden_channels = params.get('hidden_channels', 32) - self.num_layers = params.get('num_layers', 2) - # self.target = None - # self.task_type = None - - def _init_model(self, ts: InputData): - _, input_channels, input_size = ts.features.shape - self.model = MLSTM_module(input_size, input_channels, - self.hidden_size, self.hidden_channels, - self.num_classes, self.num_layers, - self.dropout) - self.model_for_inference = MLSTM_module(input_size, input_channels, - self.hidden_size, self.hidden_channels, - self.num_classes, self.num_layers, - self.dropout) - optimizer = optim.Adam(self.model.parameters(), lr=0.001) - if ts.num_classes == 2: - loss_fn = CROSS_ENTROPY() - else: - loss_fn = MULTI_CLASS_CROSS_ENTROPY() - return loss_fn, optimizer - - @convert_to_3d_torch_array - def _fit_model(self, ts: InputData): - loss_fn, optimizer = self._init_model(ts) - train_loader, val_loader = self._prepare_data(ts, split_data=True) - self._train_loop( - train_loader=train_loader, - val_loader=val_loader, - loss_fn=loss_fn, - optimizer=optimizer - ) - - -from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel 
-from typing import Optional, Callable, Any, List, Union -from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.data.data import InputData, OutputData -from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE -import torch.optim as optim -import torch.nn as nn -import torch.nn.functional as F -import torch -from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array -import pandas as pd -from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams -from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter -import torch.utils.data as data -from fedot_ind.core.architecture.settings.computational import default_device - -class SqueezeExciteBlock(nn.Module): - def __init__(self, input_channels, filters, reduce=4): - super().__init__() - self.filters = filters - self.pool = nn.AvgPool1d(input_channels) - self.bottleneck = max(self.filters // reduce, 4) - self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) - self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) - torch.nn.init.kaiming_normal_(self.fc1.weight.data) - torch.nn.init.kaiming_normal_(self.fc2.weight.data) - - def forward(self, x): - input_x = x - x = self.pool(x) - x = F.relu(self.fc1(x.view(-1, 1, self.filters))) - x = F.sigmoid(self.fc2(x)) - x = x.view(-1, self.filters, 1) * input_x - return x - -class MLSTM_module(nn.Module): - def __init__(self, input_size, input_channels, - inner_size, inner_channels, - output_size, num_layers, dropout=0.25): - super().__init__() - self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) - self.lstm = 
nn.LSTM(input_size, inner_size, num_layers, - batch_first=True, dropout=dropout) - self.conv_branch = nn.Sequential( - nn.Conv1d(input_channels, inner_channels, - padding='same', - kernel_size=9), - nn.BatchNorm1d(inner_channels), - nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels), - nn.Conv1d(inner_channels, inner_channels * 2, - padding='same', - kernel_size=5, - ), # c x l | n x c x l - nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l - nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels * 2), - nn.Conv1d(inner_channels * 2, inner_channels, - padding='same', - kernel_size=3, - ), # c x l | n x c x l - nn.BatchNorm1d(inner_channels), # n x c | n x c x l - nn.ReLU(), - ) - seq = next(iter(self.conv_branch.modules())) - idx = [0, 4, 8] - for i in idx: - torch.nn.init.kaiming_uniform_(seq[i].weight.data) - - def forward(self, x, hidden_state=None): + def forward(self, x, hidden_state=None, return_hidden_state=False): + # hidden_state = hidden_state or self.hidden_state + if not self.training: + print(x.shape) x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size x_conv = self.conv_branch(x) # n x inner_ch x len x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) x = F.softmax(self.proj(x)) + # self.hidden_state = hidden_state + if return_hidden_state: + return x, hidden_state return x#, hidden_state - def augment_zero_padding(self, X: torch.Tensor): - res = [] - for i in self.prediction_idx: - zeroed_X = X[...] - zeroed_X[..., i + 1:] = 0 - res.append(zeroed_X) - res = torch.concat(res, 0) - return res[torch.randperm(res.size(0)), ...] 
class MLSTM(BaseNeuralModel): def __init__(self, params: Optional[OperationParameters] = None): @@ -229,11 +101,19 @@ def __init__(self, params: Optional[OperationParameters] = None): self.hidden_size = params.get('hidden_size', 64) self.hidden_channels = params.get('hidden_channels', 32) self.num_layers = params.get('num_layers', 2) - # self.target = None - # self.task_type = None self.interval_percentage = params.get('interval_percentage', 10) self.min_ts_length = params.get('min_ts_length', 5) + def __repr__(self): + return 'MLSTM' + + @convert_to_3d_torch_array + def _predict_model(self, ts: InputData, output_mode='default'): + self.model.eval() + x_test = torch.Tensor(ts).to(self._device) + pred = self.model(x_test) + return self._convert_predict(pred, output_mode) + def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) prediction_idx = np.arange(0, n_idx, interval_length) @@ -241,7 +121,7 @@ def _compute_prediction_points(self, n_idx): return prediction_idx def _init_model(self, ts: InputData): - _, input_channels, input_size = ts.features.shape + *_, input_channels, input_size = ts.features.shape self.prediction_idx = self._compute_prediction_points(input_size) self.model = MLSTM_module(input_size, input_channels, self.hidden_size, self.hidden_channels, @@ -255,27 +135,40 @@ def _init_model(self, ts: InputData): if ts.num_classes == 2: loss_fn = CROSS_ENTROPY() else: - loss_fn = MULTI_CLASS_CROSS_ENTROPY() + loss_fn = CROSS_ENTROPY() return loss_fn, optimizer - def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): - return super()._train_loop(train_loader, val_loader, loss_fn, optimizer) + # @convert_to_3d_torch_array + # def predict(self, ts: InputData, output_mode: str = 'default'): + # return super().predict(ts, output_mode) + + # def predict_for_fit(self, ts: InputData, output_mode: str = 'default'): + # return super().predict_for_fit(ts, output_mode) 
@convert_to_3d_torch_array - def _fit_model(self, ts: InputData): - if isinstance(ts, torch.Tensor): - ts = self.augment_zero_padding(ts) - else: - print(type(ts)) + def _fit_model(self, ts: InputData, mode='zero_padding'): + self.epochs = 1 # !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1 loss_fn, optimizer = self._init_model(ts) - train_loader, val_loader = self._prepare_data(ts, split_data=True) + + train_loader, val_loader = self._prepare_data(ts, split_data=False, + collate_fn=getattr(self, '_augment_zero_padding')) self._train_loop( train_loader=train_loader, val_loader=val_loader, loss_fn=loss_fn, - optimizer=optimizer + optimizer=optimizer, ) - - - + def _augment_zero_padding(self, batch,): + prediction_idx = self.prediction_idx + x, y = zip(*batch) + X, y = torch.stack(x), torch.stack(y) + y = np.tile(y, (len(prediction_idx), 1)) + res = [] + for i in prediction_idx: + zeroed_X = X[...] + zeroed_X[..., i + 1:] = 0 + res.append(zeroed_X) + res = np.concatenate(res, 0) + perm = np.random.permutation(res.shape[0]) + return torch.tensor(res[perm, ...]), torch.tensor(y[perm]) From 5d9182ecbe2444389da61709da665b77f0f1e53e Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 01:27:24 +0300 Subject: [PATCH 13/43] all work, but need eval --- .../core/models/early_tc/base_early_tc.py | 3 + fedot_ind/core/models/early_tc/ecec.py | 61 +++++++++++++------ fedot_ind/core/models/early_tc/economy_k.py | 21 +++++-- .../core/models/early_tc/prob_threshold.py | 29 ++++++--- fedot_ind/core/models/early_tc/teaser.py | 19 ++++-- 5 files changed, 93 insertions(+), 40 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 5e180c2a9..38e5fd23f 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -71,6 +71,9 @@ def _select_estimators(self, X, training=False): elif training or self.prediction_mode == 'all': last_idx, offset = 
self._get_applicable_index(X.shape[-1] - 1) estimator_indices = np.arange(last_idx + 1) + elif 'last_available': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = [last_idx] else: raise ValueError('Unknown prediction mode') return estimator_indices, offset diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index 45f7f9fe4..00962a233 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -9,6 +9,7 @@ class ECEC(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): super().__init__(params) + self.__cv = 5 def _init_model(self, X, y): super()._init_model(X, y) @@ -30,34 +31,39 @@ def predict(self, X): predicted_labels, _, non_confident, confidences = self._predict(X) predicted_labels = np.stack(predicted_labels) predicted_labels[non_confident] = -1 - return predicted_labels, confidences + if self.transform_score: + confidences = self._transform_score(confidences) + return self._remove_first_1d(predicted_labels, confidences) def predict_proba(self, X): _, predicted_probas, non_confident, confidences = self._predict(X) predicted_probas = np.stack(predicted_probas) predicted_probas[non_confident] = -1 - return predicted_probas, confidences + if self.transform_score: + confidences = self._transform_score(confidences) + return self._remove_first_1d(predicted_probas, confidences) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i] + 1] + X_part = self.scalers[i].fit_transform(X_part) + self.slave_estimators[i].fit(X_part, y) + labels = cross_val_predict(self.slave_estimators[i], X_part, y, cv=self.__cv) + return labels - def _score(self, X, y, alpha, training=False): - y = y.astype(int) - predicted_labels, *_ = super()._predict(X, training) # n_pred x n_inst - predicted_labels = np.stack(predicted_labels) - n = predicted_labels.shape[0] - accuracies = (predicted_labels == np.tile(y, (n, 1))) # 
n_pred x n_inst - confidences = np.ones((n, X.shape[0]), dtype='float32') - for i in range(n): - y_pred = predicted_labels[i] - reliability_i = confusion_matrix(y, y_pred, normalize='pred') - confidences[i] = 1 - reliability_i[y, y_pred] # n_inst - self._reliabilities[i] = reliability_i - confidences = 1 - np.cumprod(confidences, axis=0) # n_pred x n_inst + def _score(self, y, y_pred, alpha): + matches = (y_pred == np.tile(y, (self.n_pred, 1))) # n_pred x n_inst + n, n_inst = matches.shape[:2] + confidences = np.ones((n, n_inst), dtype='float32') + for i in range(self.n_pred): + confidences[i] = self._reliabilities[i, y, y_pred[i]] + confidences = 1 - np.cumprod(1 - confidences, axis=0) # n_pred x n_inst candidates = self._select_thrs(confidences) # n_candidates cfs = np.zeros((len(candidates), n)) for i, candidate in enumerate(candidates): mask = confidences >= candidate # n_pred x n_inst - accuracy_for_candidate = (accuracies * mask).sum(1) / mask.sum(1) # n_pred + accuracy_for_candidate = (matches * mask).sum(1) / mask.sum(1) # n_pred cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) - self._best_estimator_idx = np.argmin(cfs.mean(0)) + self._chosen_estimator_idx = np.argmin(cfs.mean(0)) return candidates[np.argmin(cfs, axis=0)] # n_pred @staticmethod @@ -75,6 +81,23 @@ def cost_func(earliness, accuracies, alpha): return alpha * (1 - accuracies) + (1 - alpha) * earliness def fit(self, X, y): - super().fit(X, y) - self.confidence_thresholds = self._score(X, y, self.accuracy_importance, training=True) + y = np.array(y).flatten().astype(int) + self._init_model(X, y) + labels = [] + for i in range(self.n_pred): + labels.append(self._fit_one_interval(X, y, i)) + predicted_labels = np.stack(labels) + for i in range(self.n_pred): + y_pred = predicted_labels[i] + reliability_i = confusion_matrix(y, y_pred, normalize='pred') + self._reliabilities[i] = reliability_i + self.confidence_thresholds = self._score(y, predicted_labels, 
self.accuracy_importance) + + def _transform_score(self, confidences): + thr = self.confidence_thresholds[self._estimator_for_predict[-1]] + confidences = confidences - thr + positive = confidences > 0 + confidences[positive] *= 1 / (1 - thr) + confidences[~positive] *= 1 / thr + return confidences \ No newline at end of file diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 639e680cd..8eb207550 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -11,8 +11,10 @@ def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} super().__init__(params) + self.prediction_mode = params.get('prediction_mode', 'last_available') self.lambda_ = params.get('lambda', 1.) self._cluster_factor = params.get('cluster_factor' , 1) + # self.confidence_mode = params.get('confidence_mode', 'time') # or 'confidence' self._random_state = 2104 self.__cv = 5 @@ -77,13 +79,20 @@ def _get_prediction_time(self, X, cluster_centroids, i): def predict_proba(self, X): probas, times, is_optimal = self._predict(X) is_optimal = np.stack(is_optimal) - idx = np.tile(np.arange(self.n_pred), (is_optimal.shape[1], 1)).T # n_pred x n_inst - idx[~is_optimal] = self.n_pred - idx = np.argmin(idx, 0) - probas = np.stack(probas) - return probas[idx], np.stack(times)[idx] + probas, times = np.stack(probas), np.stack(times) + if self.transform_score: + times = self._transform_score(times) + return self._remove_first_1d(probas, times) def predict(self, X): probas, times = self.predict_proba(X) labels = probas.argmax(-1) - return labels, times + return self._remove_first_1d(labels, times) + + def _transform_score(self, time): + idx = self._estimator_for_predict[-1] + scores = -(1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) + scores[scores == 0] = 1 # no posibility for lininterp when sure + return scores + + diff --git 
a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 51d169909..8dcb8828f 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -7,7 +7,7 @@ class ProbabilityThresholdClassifier(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} - super().__init__() + super().__init__(params) self.probability_threshold = params.get('probability_threshold', None) def _init_model(self, X, y): @@ -18,19 +18,23 @@ def _init_model(self, X, y): def predict_proba(self, X): _, predicted_probas, non_acceptance = self._predict(X) predicted_probas[non_acceptance] = 0 - return predicted_probas.squeeze() + scores = predicted_probas.max(-1) + if self.transform_score: + scores = self._transform_score(scores) + return self._remove_first_1d(predicted_probas, scores) def predict(self, X): - predicted_labels, _, non_acceptance = self._predict(X, training=False) + predicted_labels, predicted_probas, non_acceptance = self._predict(X, training=False) predicted_labels[non_acceptance] = -1 - # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] - return predicted_labels # prediction_points x n_instances + scores = predicted_probas.max(-1) + if self.transform_score: + scores = self._transform_score(scores) + return self._remove_first_1d(predicted_labels, scores) # (prediction_points x) n_instances def _predict(self, X, training=True): predicted_probas, predicted_labels = super()._predict(X, training) predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) - # print(predicted_labels.shape, predicted_probas.shape) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions double_check = predicted_probas.max(axis=-1) > self.probability_threshold non_acceptance[non_acceptance & double_check] = False @@ -38,10 +42,17 @@ def _predict(self, X, training=True): 
def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) - self._best_estimator_idx = np.argmax(scores) + self._chosen_estimator_idx = np.argmax(scores) return scores def fit(self, X, y): super().fit(X, y) - return self._score(X, y, self.accuracy_importance) - + self._score(X, y, self.accuracy_importance) + + def _transform_score(self, confidences): + thr = self.probability_threshold + confidences = confidences - thr + positive = confidences > 0 + confidences[positive] *= 1 / (1 - thr) + confidences[~positive] *= 1 / thr + return confidences diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 593a34e72..6ddc19a45 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -56,31 +56,38 @@ def _predict(self, X): # for each point of estimation for i in range(predicted_labels.shape[0]): # find not accepted points - ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] - X_to_ith = X_ocs[i][ith_point_to_oc] + X_to_ith = X_ocs[i] # if they are not outliers final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # 1 for accept -1 for reject # mark as accepted - non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False + # non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False final_verdicts[i] = final_verdict + non_acceptance[non_acceptance & (final_verdict > 0)] = False return predicted_labels, predicted_probas, non_acceptance, final_verdicts def predict_proba(self, X): _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] - return predicted_probas.squeeze() + if self.transform_score: + final_verdicts = self._transform_score(final_verdicts) + return self._remove_first_1d(predicted_probas, final_verdicts) def predict(self, X): predicted_labels, _, non_acceptance, final_verdicts = 
self._predict(X) predicted_labels[non_acceptance] = -1 # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] - return predicted_labels # prediction_points x n_instances + if self.transform_score: + final_verdicts = self._transform_score(final_verdicts) + return self._remove_first_1d(predicted_labels, final_verdicts) # (prediction_points x) n_instances def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) - self._best_estimator_idx = np.argmax(scores) + self._chosen_estimator_idx = np.argmax(scores) return scores def fit(self, X, y): super().fit(X, y) return self._score(X, y, self.accuracy_importance) + + def _transform_score(self, scores): + return np.tanh(scores) From 41c329c5bde01ce902ee831552103ab4aa350f05 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 12:09:39 +0300 Subject: [PATCH 14/43] evth converged to one interface + refactored --- .../core/models/early_tc/base_early_tc.py | 53 ++-- fedot_ind/core/models/early_tc/ecec.py | 18 +- fedot_ind/core/models/early_tc/economy_k.py | 15 +- .../core/models/early_tc/prob_threshold.py | 14 +- fedot_ind/core/models/early_tc/teaser.py | 23 +- .../core/models/nn/network_impl/mlstm.py | 235 ++++++++++++------ .../data/default_operation_params.json | 14 +- .../data/industrial_model_repository.json | 22 +- fedot_ind/core/repository/model_repository.py | 8 +- fedot_ind/core/tuning/search_space.py | 32 ++- 10 files changed, 281 insertions(+), 153 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 38e5fd23f..9fbc162c5 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -11,10 +11,12 @@ def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} super().__init__() - self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') self.interval_percentage = 
params.get('interval_percentage', 10) - self.consecutive_predictions = params.get('consecutive_predictions', 3) + self.consecutive_predictions = params.get('consecutive_predictions', 1) self.accuracy_importance = params.get('accuracy_importance', 1.) + + self.prediction_mode = params.get('prediction_mode', 'last_available') + self.transform_score = params.get('transform_score', True) self.min_ts_length = params.get('min_ts_step', 3) self.random_state = params.get('random_state', None) self.weasel_params = {} @@ -26,14 +28,15 @@ def _init_model(self, X, y): self.n_pred = len(self.prediction_idx) self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] self.scalers = [StandardScaler() for _ in range(self.n_pred)] - self._best_estimator_idx = -1 + self._chosen_estimator_idx = -1 self.classes_ = [np.unique(y)] + self._estimator_for_predict = [-1] @property def required_length(self): - if not hasattr(self, '_best_estimator_idx'): + if not hasattr(self, '_chosen_estimator_idx'): return None - return self.prediction_idx[self._best_estimator_idx] + return self.prediction_idx[self._chosen_estimator_idx] @property def n_classes(self): @@ -47,7 +50,7 @@ def fit(self, X, y=None): self._fit_one_interval(X, y, i) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
+ X_part = X[..., :self.prediction_idx[i] + 1] X_part = self.scalers[i].fit_transform(X_part) probas = self.slave_estimators[i].fit_predict_proba(X_part, y) return probas @@ -67,19 +70,21 @@ def _compute_prediction_points(self, n_idx): def _select_estimators(self, X, training=False): offset = 0 if not training and self.prediction_mode == 'best_by_harmonic_mean': - estimator_indices = [self._best_estimator_idx] + estimator_indices = [self._chosen_estimator_idx] + elif not training and self.prediction_mode == 'last_available': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = [last_idx] elif training or self.prediction_mode == 'all': last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) estimator_indices = np.arange(last_idx + 1) - elif 'last_available': - last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) - estimator_indices = [last_idx] else: raise ValueError('Unknown prediction mode') return estimator_indices, offset def _predict(self, X, training=True): estimator_indices, offset = self._select_estimators(X, training) + if not training: + self._estimator_for_predict = estimator_indices prediction = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) @@ -94,20 +99,32 @@ def _consecutive_count(self, predicted_labels: List[np.array]): consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 return consecutive_labels # prediction_points x n_instances - def predict_proba(self, X): - raise NotImplementedError + def predict_proba(self, *args): + predicted_probas, scores, *_ = args + if self.transform_score: + scores = self._transform_score(scores) + scores = np.tile(scores[..., None], (1, 1, self.n_classes)) + prediction = np.stack([predicted_probas, scores], axis=0) + if prediction.shape[1] == 1: + prediction = prediction.squeeze(1) + return prediction def predict(self, X): - raise NotImplementedError + prediction = self.predict_proba(X) + labels = 
prediction[0:1].argmax(-1) + scores = prediction[1:2, ..., 0] + prediction = np.stack([labels, scores], 0) + if prediction.shape[1] == 1: + prediction = prediction.squeeze(1) + return prediction - def _score(self, X, y, hm_shift_to_acc=None): + def _score(self, X, y, accuracy_importance=None, training=True): y = np.array(y).flatten() - hm_shift_to_acc = hm_shift_to_acc or self.accuracy_importance - predictions = self._predict(X)[0] + accuracy_importance = accuracy_importance or self.accuracy_importance + predictions = self._predict(X, training)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) - return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) - + return (1 + accuracy_importance) * accuracies * self.earliness[:prediction_points] / (accuracy_importance * accuracies + self.earliness[:prediction_points]) def _get_applicable_index(self, last_available_idx): idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index 00962a233..f6e163d25 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -3,7 +3,6 @@ from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.models.early_tc.base_early_tc import BaseETC from sklearn.model_selection import cross_val_predict -from sklearn.base import clone from sklearn.metrics import confusion_matrix class ECEC(BaseETC): @@ -25,23 +24,14 @@ def _predict(self, X, training=False): reliabilities = np.stack(reliabilities) confidences = 1 - np.cumprod(1 - reliabilities, axis=0) non_confident = confidences < self.confidence_thresholds[:len(predicted_labels), None] - return predicted_labels, predicted_probas, non_confident, confidences - - def predict(self, X): - 
predicted_labels, _, non_confident, confidences = self._predict(X) predicted_labels = np.stack(predicted_labels) - predicted_labels[non_confident] = -1 - if self.transform_score: - confidences = self._transform_score(confidences) - return self._remove_first_1d(predicted_labels, confidences) + predicted_probas = np.stack(predicted_probas) + return predicted_labels, predicted_probas, non_confident, confidences def predict_proba(self, X): _, predicted_probas, non_confident, confidences = self._predict(X) - predicted_probas = np.stack(predicted_probas) predicted_probas[non_confident] = -1 - if self.transform_score: - confidences = self._transform_score(confidences) - return self._remove_first_1d(predicted_probas, confidences) + return super().predict_proba(predicted_probas, confidences) def _fit_one_interval(self, X, y, i): X_part = X[..., :self.prediction_idx[i] + 1] @@ -52,7 +42,7 @@ def _fit_one_interval(self, X, y, i): def _score(self, y, y_pred, alpha): matches = (y_pred == np.tile(y, (self.n_pred, 1))) # n_pred x n_inst - n, n_inst = matches.shape[:2] + n, n_inst, *_ = matches.shape confidences = np.ones((n, n_inst), dtype='float32') for i in range(self.n_pred): confidences[i] = self._reliabilities[i, y, y_pred[i]] diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 8eb207550..bf09acd4b 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -4,7 +4,7 @@ from fedot_ind.core.models.early_tc.base_early_tc import BaseETC from sklearn.cluster import KMeans from sklearn.metrics import confusion_matrix -from sklearn.model_selection import train_test_split, cross_val_predict +from sklearn.model_selection import cross_val_predict class EconomyK(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): @@ -14,7 +14,6 @@ def __init__(self, params: Optional[OperationParameters] = None): self.prediction_mode = params.get('prediction_mode', 
'last_available') self.lambda_ = params.get('lambda', 1.) self._cluster_factor = params.get('cluster_factor' , 1) - # self.confidence_mode = params.get('confidence_mode', 'time') # or 'confidence' self._random_state = 2104 self.__cv = 5 @@ -77,17 +76,9 @@ def _get_prediction_time(self, X, cluster_centroids, i): return time_optimal, is_optimal # n_inst def predict_proba(self, X): - probas, times, is_optimal = self._predict(X) - is_optimal = np.stack(is_optimal) + probas, times, _ = self._predict(X, training=False) probas, times = np.stack(probas), np.stack(times) - if self.transform_score: - times = self._transform_score(times) - return self._remove_first_1d(probas, times) - - def predict(self, X): - probas, times = self.predict_proba(X) - labels = probas.argmax(-1) - return self._remove_first_1d(labels, times) + return super().predict_proba(probas, times) def _transform_score(self, time): idx = self._estimator_for_predict[-1] diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 8dcb8828f..773f79d8e 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -16,20 +16,10 @@ def _init_model(self, X, y): self.probability_threshold = 1 / len(self.classes_[0]) def predict_proba(self, X): - _, predicted_probas, non_acceptance = self._predict(X) + _, predicted_probas, non_acceptance = self._predict(X, training=False) predicted_probas[non_acceptance] = 0 scores = predicted_probas.max(-1) - if self.transform_score: - scores = self._transform_score(scores) - return self._remove_first_1d(predicted_probas, scores) - - def predict(self, X): - predicted_labels, predicted_probas, non_acceptance = self._predict(X, training=False) - predicted_labels[non_acceptance] = -1 - scores = predicted_probas.max(-1) - if self.transform_score: - scores = self._transform_score(scores) - return self._remove_first_1d(predicted_labels, scores) # (prediction_points x) 
n_instances + return super().predict_proba(predicted_probas, scores) def _predict(self, X, training=True): predicted_probas, predicted_labels = super()._predict(X, training) diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 6ddc19a45..35328c535 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,9 +1,9 @@ from typing import Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np -from sklearn.svm import OneClassSVM -from sklearn.model_selection import GridSearchCV from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from sklearn.model_selection import GridSearchCV +from sklearn.svm import OneClassSVM class TEASER(BaseETC): @@ -13,6 +13,7 @@ def __init__(self, params: Optional[OperationParameters] = None): def _init_model(self, X, y): super()._init_model(X, y) + def _init_model(self, X, y): super()._init_model(X, y) self.oc_estimators = [None] * self.n_pred @@ -42,13 +43,12 @@ def _form_X_oc(self, predicted_probas): d = d.min(axis=-1).reshape(-1, 1) return np.hstack([predicted_probas, d]) - def _predict(self, X): + def _predict(self, X, training=False): estimator_indices, offset = self._select_estimators(X) X_ocs, predicted_probas, predicted_labels = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions - to_oc_check = np.argwhere(non_acceptance) X_ocs = np.stack(X_ocs) predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) @@ -58,9 +58,8 @@ def _predict(self, X): # find not accepted points X_to_ith = X_ocs[i] # if they are not outliers - final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # 1 for accept -1 for reject + final_verdict = 
self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # mark as accepted - # non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False final_verdicts[i] = final_verdict non_acceptance[non_acceptance & (final_verdict > 0)] = False return predicted_labels, predicted_probas, non_acceptance, final_verdicts @@ -68,17 +67,7 @@ def _predict(self, X): def predict_proba(self, X): _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] - if self.transform_score: - final_verdicts = self._transform_score(final_verdicts) - return self._remove_first_1d(predicted_probas, final_verdicts) - - def predict(self, X): - predicted_labels, _, non_acceptance, final_verdicts = self._predict(X) - predicted_labels[non_acceptance] = -1 - # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] - if self.transform_score: - final_verdicts = self._transform_score(final_verdicts) - return self._remove_first_1d(predicted_labels, final_verdicts) # (prediction_points x) n_instances + return super().predict_proba(predicted_probas, final_verdicts) def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 612d2b11b..3e1d3c4b5 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -1,23 +1,20 @@ +import copy from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel from typing import Optional, Callable, Any, List, Union from fedot.core.operations.operation_parameters import OperationParameters from fedot.core.data.data import InputData, OutputData from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE import torch.optim as optim -from torch.optim import lr_scheduler +import 
torch.optim.lr_scheduler as lr_scheduler import torch.nn as nn import torch.nn.functional as F import torch -from tqdm import tqdm +from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array, fedot_data_type +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array import pandas as pd -from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter import torch.utils.data as data -from fedot_ind.core.architecture.settings.computational import default_device class SqueezeExciteBlock(nn.Module): def __init__(self, input_channels, filters, reduce=4): @@ -46,20 +43,22 @@ def __init__(self, input_size, input_channels, self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) self.lstm = nn.LSTM(input_size, inner_size, num_layers, batch_first=True, dropout=dropout) + + squeeze_excite_size = input_size #if not interval else interval self.conv_branch = nn.Sequential( nn.Conv1d(input_channels, inner_channels, padding='same', kernel_size=9), nn.BatchNorm1d(inner_channels), nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels), + SqueezeExciteBlock(squeeze_excite_size, inner_channels), nn.Conv1d(inner_channels, inner_channels * 2, padding='same', kernel_size=5, ), # c x l | n x c x l nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels * 2), + SqueezeExciteBlock(squeeze_excite_size, inner_channels * 2), nn.Conv1d(inner_channels * 2, inner_channels, padding='same', kernel_size=3, @@ -72,103 +71,197 @@ def __init__(self, input_size, 
input_channels, for i in idx: torch.nn.init.kaiming_uniform_(seq[i].weight.data) - def forward(self, x, hidden_state=None, return_hidden_state=False): - # hidden_state = hidden_state or self.hidden_state - if not self.training: - print(x.shape) + def forward(self, x, hidden_state=None, return_hidden=False): x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size x_conv = self.conv_branch(x) # n x inner_ch x len x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) x = F.softmax(self.proj(x)) - # self.hidden_state = hidden_state - if return_hidden_state: + if return_hidden: return x, hidden_state - return x#, hidden_state - + return x + class MLSTM(BaseNeuralModel): def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} super().__init__() - # self.num_classes = params.get('num_classes', None) - # self.epochs = params.get('epochs', 100) - # self.batch_size = params.get('batch_size', 16) - # self.activation = params.get('activation', 'ReLU') - # self.learning_rate = 0.001 - self.dropout = params.get('dropout', 0.25) self.hidden_size = params.get('hidden_size', 64) self.hidden_channels = params.get('hidden_channels', 32) self.num_layers = params.get('num_layers', 2) self.interval_percentage = params.get('interval_percentage', 10) self.min_ts_length = params.get('min_ts_length', 5) - + self.fitting_mode = params.get('fitting_mode', 'zero_padding') + self.proba_thr = params.get('proba_thr', None) + def __repr__(self): return 'MLSTM' - @convert_to_3d_torch_array - def _predict_model(self, ts: InputData, output_mode='default'): - self.model.eval() - x_test = torch.Tensor(ts).to(self._device) - pred = self.model(x_test) - return self._convert_predict(pred, output_mode) - def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) - prediction_idx = np.arange(0, n_idx, interval_length) + 
prediction_idx = np.arange(interval_length - 1, n_idx, interval_length) self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 - return prediction_idx + return prediction_idx, interval_length def _init_model(self, ts: InputData): - *_, input_channels, input_size = ts.features.shape - self.prediction_idx = self._compute_prediction_points(input_size) - self.model = MLSTM_module(input_size, input_channels, + _, input_channels, input_size = ts.features.shape + self.input_size = input_size + self.prediction_idx, self.interval = self._compute_prediction_points(input_size) + self.model = MLSTM_module(input_size if self.fitting_mode != 'moving_window' else self.interval, + input_channels, self.hidden_size, self.hidden_channels, self.num_classes, self.num_layers, self.dropout) - self.model_for_inference = MLSTM_module(input_size, input_channels, + self.model_for_inference = MLSTM_module(input_size if self.fitting_mode != 'moving_window' else self.interval, + input_channels, self.hidden_size, self.hidden_channels, self.num_classes, self.num_layers, self.dropout) optimizer = optim.Adam(self.model.parameters(), lr=0.001) - if ts.num_classes == 2: - loss_fn = CROSS_ENTROPY() - else: - loss_fn = CROSS_ENTROPY() + loss_fn = CROSS_ENTROPY() return loss_fn, optimizer - # @convert_to_3d_torch_array - # def predict(self, ts: InputData, output_mode: str = 'default'): - # return super().predict(ts, output_mode) - - # def predict_for_fit(self, ts: InputData, output_mode: str = 'default'): - # return super().predict_for_fit(ts, output_mode) - @convert_to_3d_torch_array - def _fit_model(self, ts: InputData, mode='zero_padding'): - self.epochs = 1 # !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1 + def _fit_model(self, ts: InputData): + mode = self.fitting_mode loss_fn, optimizer = self._init_model(ts) + train_loader, val_loader = self._prepare_data(ts, split_data=True, + collate_fn=getattr(self, '_augment_with_zeros')) + if mode == 'zero_padding': + 
super()._train_loop( + train_loader=train_loader, + val_loader=val_loader, + loss_fn=loss_fn, + optimizer=optimizer + ) + elif mode == 'moving_window': + self._train_loop( + train_loader=train_loader, + val_loader=None, + loss_fn=loss_fn, + optimizer=optimizer + ) + else: + raise ValueError('Unknown fitting mode') + + def _moving_window_output(self, inputs): + hidden_state = None + output = -torch.ones((inputs.shape[0], self.num_classes)) + for i in self.prediction_idx: + if i >= inputs.shape[-1]: + break + batch_interval = inputs[..., i - self.prediction_idx[0] : i + 1] + output, hidden_state = self.model(batch_interval, hidden_state, return_hidden=True) + return output - train_loader, val_loader = self._prepare_data(ts, split_data=False, - collate_fn=getattr(self, '_augment_zero_padding')) - self._train_loop( - train_loader=train_loader, - val_loader=val_loader, - loss_fn=loss_fn, - optimizer=optimizer, - ) + def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): + early_stopping = EarlyStopping() + scheduler = lr_scheduler.OneCycleLR(optimizer=optimizer, + steps_per_epoch=len(train_loader), + epochs=self.epochs, + max_lr=self.learning_rate) + if val_loader is None: + print('Not enough class samples for validation') + + best_model = None + best_val_loss = float('inf') + val_interval = self.get_validation_frequency( + self.epochs, self.learning_rate) - def _augment_zero_padding(self, batch,): - prediction_idx = self.prediction_idx - x, y = zip(*batch) - X, y = torch.stack(x), torch.stack(y) - y = np.tile(y, (len(prediction_idx), 1)) - res = [] - for i in prediction_idx: - zeroed_X = X[...] 
- zeroed_X[..., i + 1:] = 0 - res.append(zeroed_X) - res = np.concatenate(res, 0) - perm = np.random.permutation(res.shape[0]) - return torch.tensor(res[perm, ...]), torch.tensor(y[perm]) + for epoch in range(1, self.epochs + 1): + training_loss = 0.0 + valid_loss = 0.0 + self.model.train() + total = 0 + correct = 0 + for batch in tqdm(train_loader): + optimizer.zero_grad() + inputs, targets = batch + output = self._moving_window_output(inputs) + loss = loss_fn(output, targets.float()) + loss.backward() + optimizer.step() + training_loss += loss.data.item() * inputs.size(0) + total += targets.size(0) + correct += (torch.argmax(output, 1) == + torch.argmax(targets, 1)).sum().item() + + accuracy = correct / total + training_loss /= len(train_loader.dataset) + print('Epoch: {}, Accuracy = {}, Training Loss: {:.2f}'.format( + epoch, accuracy, training_loss)) + + if val_loader is not None and epoch % val_interval == 0: + self.model.eval() + total = 0 + correct = 0 + for batch in val_loader: + inputs, targets = batch + + output = self.model(inputs) + + loss = loss_fn(output, targets.float()) + + valid_loss += loss.data.item() * inputs.size(0) + total += targets.size(0) + correct += (torch.argmax(output, 1) == + torch.argmax(targets, 1)).sum().item() + if valid_loss < best_val_loss: + best_val_loss = valid_loss + best_model = copy.deepcopy(self.model) + + early_stopping(training_loss, self.model, './') + adjust_learning_rate(optimizer, scheduler, + epoch + 1, self.learning_rate, printout=False) + scheduler.step() + + if early_stopping.early_stop: + print("Early stopping") + break + + if best_model is not None: + self.model = best_model + + @convert_to_3d_torch_array + def _predict_model(self, x_test: InputData, output_mode: str = 'default'): + self.model.eval() + if self.fitting_mode == 'zero_padding': + x_test = self._padding(x_test).to(self._device) + pred = self.model(x_test) + elif self.fitting_mode == 'moving_window': + pred = 
self._moving_window_output(torch.tensor(x_test).float()) + else: + raise ValueError('Unknown prediction mode') + return self._convert_predict(pred, output_mode) + + def _padding(self, ts: np.array): + if ts.shape[-1] == self.input_size: + return torch.tensor(ts).float() + n, ch, size = ts.shape + x = torch.zeros((n, ch, self.input_size)).float() + x[..., :size] = ts + return x + + def _augment_with_zeros(self, batch: np.array): + X, y = zip(*batch) + X, y = np.stack(X), np.stack(y) + X_res, y_res = [], [] + for i in self.prediction_idx: + x = X[...] + x[..., :i + i] = 0 + X_res.append(x) + y_res.append(y) + X_res = np.concatenate(X_res) + y_res = np.concatenate(y_res) + perm = np.random.permutation(X_res.shape[0]) + return torch.tensor(X_res[perm]), torch.tensor(y_res[perm]) + + def _transform_score(self, probas): + # linear interp + thr = self.proba_thr + probas = probas - thr + positive = probas > 0 + probas[positive] *= 1 / (1 - thr) + probas[~positive] *= 1 / thr + return probas diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index b875c3225..46c5d8c3c 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -130,15 +130,25 @@ "min_samples_leaf": 10, "bootstrap": false }, + "ecec": { + "interval_percentage": 10, + "accuracy_importance": 0.7 + }, + "economy_k": { + "interval_percentage": 10, + "accuracy_importance": 0.7, + "cluster_factor": 1, + "lambda": 1 + }, "teaser": { "interval_percentage": 10, "consecutive_predictions": 3, - "hm_shift_to_acc": 2 + "accuracy_importance": 2 }, "proba_threshold_etc": { "interval_percentage": 10, "consecutive_predictions": 3, - "hm_shift_to_acc": 2 + "accuracy_importance": 2 }, "dt": { "max_depth": 5, diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 
0823954a2..aad712d78 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -623,10 +623,18 @@ "non_linear" ] }, - "teaser": { + "ecec": { + "meta": "sklearn_class", + "tags": [ + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" + }, + "economy_k": { "meta": "sklearn_class", "tags": [ - "simple", "interpretable", "non_lagged", "non_linear" @@ -643,6 +651,16 @@ ], "input_type": "[DataTypesEnum.table]" }, + "teaser": { + "meta": "sklearn_class", + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" + }, "xgboost": { "meta": "sklearn_class", "presets": ["*tree"], diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index 9777b81c1..722325817 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -44,8 +44,10 @@ from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor from xgboost import XGBRegressor -from fedot_ind.core.models.early_tc.teaser import TEASER +from fedot_ind.core.models.early_tc.ecec import ECEC +from fedot_ind.core.models.early_tc.economy_k import EconomyK from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier +from fedot_ind.core.models.early_tc.teaser import TEASER from fedot_ind.core.models.manifold.riemann_embeding import RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR @@ -137,8 +139,10 @@ class AtomizedModel(Enum): # external models 'lgbm': LGBMClassifier, # Early classification + 'ecec': ECEC, + 'economy_k': EconomyK, + 'proba_threshold_etc': ProbabilityThresholdClassifier, 'teaser': TEASER, - 'proba_threshold_etc': ProbabilityThresholdClassifier } 
FEDOT_PREPROC_MODEL = { # data standartization diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 11be89db9..25faa8a07 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -60,15 +60,41 @@ 'selection_strategy': {'hyperopt-dist': hp.choice, 'sampling-scope': [['sum', 'pairwise']]} }, - 'teaser': + 'ecec': { + 'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'accuracy_importance': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[i / 10 for i in range(11)]]}, + }, + 'economy_k': { + 'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'lambda': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[1e-6, 1e-3, 1e-2, 1e-1, 1, 1e1, 1e2, 1e3, 1e4, 1e6]]}, + 'accuracy_importance': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[i / 10 for i in range(11)]]}, + }, + 'mlstm_model': { + 'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'dropout': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5]]}, + 'hidden_size': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(10, 101, 10))]}, + 'num_layers': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(1, 6))]}, + 'hidden_channels': {'hyperopt-dist': hp.choice, + 'sampling-scope': [8, 16, 32, 64, 96]}, + }, + 'proba_threshold_etc': {'interval_percentage': {'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, - 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, + 'accuracy_importance': {'hyperopt-dist': hp.choice, 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, }, - 'proba_threshold_etc': + 'teaser': {'interval_percentage': {'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, From 
96c10091d8f8c6f431d8c3cf29b9f6fca13c74ef Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 15:02:54 +0300 Subject: [PATCH 15/43] slight fixes --- fedot_ind/core/models/early_tc/base_early_tc.py | 2 +- fedot_ind/core/models/early_tc/economy_k.py | 9 ++++++--- .../core/repository/data/default_operation_params.json | 4 ++-- fedot_ind/core/tuning/search_space.py | 6 +++--- 4 files changed, 12 insertions(+), 9 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 9fbc162c5..cbed8c463 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -124,7 +124,7 @@ def _score(self, X, y, accuracy_importance=None, training=True): predictions = self._predict(X, training)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) - return (1 + accuracy_importance) * accuracies * self.earliness[:prediction_points] / (accuracy_importance * accuracies + self.earliness[:prediction_points]) + return (1 - accuracy_importance) * self.earliness[:prediction_points] + accuracy_importance * accuracies def _get_applicable_index(self, last_available_idx): idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index bf09acd4b..c39097189 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -65,7 +65,7 @@ def __expected_costs(self, X, cluster_centroids, i): np.sum(self.state[i:], axis=-1), axes=(0, 2, 1) ) * self._pyck_[None, ...], axis=1) costs = cluster_probas @ s_glob.T # n_inst x time_left - costs += self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? + costs -= self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? 
return costs def _get_prediction_time(self, X, cluster_centroids, i): @@ -82,8 +82,11 @@ def predict_proba(self, X): def _transform_score(self, time): idx = self._estimator_for_predict[-1] - scores = -(1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) - scores[scores == 0] = 1 # no posibility for lininterp when sure + scores = (1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) # [1 / n; 1 ] - 1 / n) * n /(n - 1) * 2 - 1 + n = self.n_pred + scores -= 1 / n + scores *= n / (n - 1) * 2 + scores -= 1 return scores diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index 46c5d8c3c..0167e0195 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -143,12 +143,12 @@ "teaser": { "interval_percentage": 10, "consecutive_predictions": 3, - "accuracy_importance": 2 + "accuracy_importance": 0.5 }, "proba_threshold_etc": { "interval_percentage": 10, "consecutive_predictions": 3, - "accuracy_importance": 2 + "accuracy_importance": 0.5 }, "dt": { "max_depth": 5, diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 25faa8a07..8ab927edb 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -92,15 +92,15 @@ 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, 'accuracy_importance': {'hyperopt-dist': hp.choice, - 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, }, 'teaser': {'interval_percentage': {'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, - 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, - 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + 'accuracy_importance': 
{'hyperopt-dist': hp.choice, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, }, 'deepar_model': {'epochs': {'hyperopt-dist': hp.choice, From 743c404b0183e075897a2d026cb7d1cba936fd62 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 14 Jun 2024 12:21:29 +0300 Subject: [PATCH 16/43] metrics started --- fedot_ind/core/models/early_tc/metrics.py | 122 ++++++++++++++++++++++ fedot_ind/core/models/early_tc/teaser.py | 0 2 files changed, 122 insertions(+) create mode 100644 fedot_ind/core/models/early_tc/metrics.py create mode 100644 fedot_ind/core/models/early_tc/teaser.py diff --git a/fedot_ind/core/models/early_tc/metrics.py b/fedot_ind/core/models/early_tc/metrics.py new file mode 100644 index 000000000..a4cb9cef5 --- /dev/null +++ b/fedot_ind/core/models/early_tc/metrics.py @@ -0,0 +1,122 @@ +from sklearn.metrics import confusion_matrix +import numpy as np +import pandas as pd +from fedot.core.data.data import InputData, OutputData +from typing import Tuple, List, Optional, Union, Literal + +def conf_matrix(actual, predicted): + cm = confusion_matrix(actual, predicted) + return dict(TN=cm[0, 0], FP=cm[0, 1], FN=cm[1, 0], TP=[1, 1]) + +def average_delay(boundaries, prediction, + point, + use_idx=True, + window_placement='lefter'): + cp_confusion = extract_cp_cm(boundaries, prediction, use_idx=use_idx, use_switch_point=False) + # statistics + statistics = { + 'anomalies_num': len(cp_confusion['TPs']) + len(cp_confusion['FPs']), + 'FP_num': len(cp_confusion['FPs']), + 'missed': len(cp_confusion['FNs']) + } + time_func = { + 'righter': lambda triplet: triplet[1] - triplet[0], + 'lefter': lambda triplet: triplet[2] - triplet[1], + 'central': lambda triplet: triplet[1] - triplet[0] - (triplet[2] - triplet[0]) / 2 + }[window_placement] + + detection_history = { + i: time_func(triplet) for i, triplet in cp_confusion['TPs'].items() + } + return detection_history, statistics + + + +def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], + 
prediction: pd.DataFrame, + use_switch_point: bool = True, # if first anomaly dot is considered as changepoint + use_idx: bool = False): + if isinstance(boundaries, pd.DataFrame): + boundaries = boundaries.values.T + anomaly_tsp = prediction[prediction == 1].sort_index().index + TPs, FNs, FPs = {}, [], [] + + if boundaries.shape[1]: + + FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest + for i, (b_low, b_up) in enumerate(boundaries): + all_tsp_in_window = prediction[b_low: b_up].index + anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp + if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? + FNs.append(i if use_idx else all_tsp_in_window) + TPs[i] = [b_low, anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, b_up] + if not use_idx: + FNs.append(all_tsp_in_window - anomaly_tsp_in_window) + FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest + else: + FPs.append(anomaly_tsp) + + FPs = np.concatenate(FPs) + FNs = np.concatenate(FNs) + + return dict( + FP=FPs, + FN=FNs, + TP=TPs + ) + + +# cognate of single_detecting_boundaries +def get_boundaries(idx, actual_timestamps, window_size:int = None, + window_placement: Literal['left', 'right', 'central'] = 'left', + intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', + ): + # idx = idx + # cast everything to pandas object fir the subsequent comfort + if isinstance(idx, np.array): + if idx.dtype == np.dtype('O'): + idx = pd.to_datetime(pd.Series(idx)) + td = pd.Timedelta(window_size) + else: + idx = pd.Series(idx) + td = window_size + else: + raise TypeError('Unexpected type of ts index') + + boundaries = np.tile(actual_timestamps, (2, 1)) + # [0, ...] - lower bound, [1, ...] 
- upper + if window_placement == 'left': + boundaries[0] -= td + elif window_placement == 'central': + boundaries[0] -= td / 2 + boundaries[1] += td / 2 + elif window_placement == 'right': + boundaries[1] += td + else: + raise ValueError('Unknown mode') + + if not len(actual_timestamps): + return boundaries + + # intersection resolution + for i in range(len(actual_timestamps) - 1): + if not boundaries[0, i + 1] > boundaries[1, i]: + continue + + if intersection_mode == 'shift_to_left': + boundaries[0, i + 1] = boundaries[1, i] + elif intersection_mode == 'shift_to_right': + boundaries[1, i] = boundaries[0, i + 1] + elif intersection_mode == 'uniform': + boundaries[1, i], boundaries[0, i + 1] = boundaries[0, i + 1], boundaries[1, i] + else: + raise ValueError('Unknown intersection resolution') + + # filtering + idx_to_keep = np.abs(np.diff(boundaries, axis=0)) > 1e-6 + boundaries = boundaries[..., idx_to_keep] + boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) + return boundaries + + + diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py new file mode 100644 index 000000000..e69de29bb From c3de1151c4562ca4246755f6d9eb1e1052c227ed Mon Sep 17 00:00:00 2001 From: leostre Date: Thu, 20 Jun 2024 13:17:30 +0300 Subject: [PATCH 17/43] metrics ended --- fedot_ind/core/models/early_tc/metrics.py | 26 ++++++++++++++++++----- 1 file changed, 21 insertions(+), 5 deletions(-) diff --git a/fedot_ind/core/models/early_tc/metrics.py b/fedot_ind/core/models/early_tc/metrics.py index a4cb9cef5..f4a5f6544 100644 --- a/fedot_ind/core/models/early_tc/metrics.py +++ b/fedot_ind/core/models/early_tc/metrics.py @@ -30,7 +30,8 @@ def average_delay(boundaries, prediction, } return detection_history, statistics - +def tp_transform(tps): + return np.diff(tps[[1, 0]], axis=0) / np.diff(tps[[-1, 0]], axis=0) def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], prediction: pd.DataFrame, @@ -49,7 +50,9 @@ def 
extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? FNs.append(i if use_idx else all_tsp_in_window) - TPs[i] = [b_low, anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, b_up] + TPs[i] = [b_low, + anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, + b_up] if not use_idx: FNs.append(all_tsp_in_window - anomaly_tsp_in_window) FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest @@ -62,10 +65,9 @@ def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], return dict( FP=FPs, FN=FNs, - TP=TPs + TP=np.stack(TPs) ) - # cognate of single_detecting_boundaries def get_boundaries(idx, actual_timestamps, window_size:int = None, window_placement: Literal['left', 'right', 'central'] = 'left', @@ -118,5 +120,19 @@ def get_boundaries(idx, actual_timestamps, window_size:int = None, boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) return boundaries - +def nab(boundaries, predictions, mode='standard', custom_coefs=None): + inner_coefs = { + 'low_FP': [1.0, -0.11, -1.0], + 'standard': [1., -0.22, -1.], + 'lof_FN': [1., -0.11, -2.] 
+ } + coefs = custom_coefs or inner_coefs[mode] + confusion_matrix = extract_cp_cm(boundaries, predictions) + + tps = confusion_matrix['tps'] + + score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], + coefs) + return score + From d4ee881c22c3afaa31536e43f756d9a637dfdf3c Mon Sep 17 00:00:00 2001 From: leostre Date: Mon, 24 Jun 2024 03:05:51 +0300 Subject: [PATCH 18/43] in basis teaser is completed, need some make-up and add cut ts support --- fedot_ind/core/metrics/interval_metrics.py | 138 +++++++++++++++++++++ fedot_ind/core/models/early_tc/teaser.py | 123 ++++++++++++++++++ 2 files changed, 261 insertions(+) create mode 100644 fedot_ind/core/metrics/interval_metrics.py diff --git a/fedot_ind/core/metrics/interval_metrics.py b/fedot_ind/core/metrics/interval_metrics.py new file mode 100644 index 000000000..f4a5f6544 --- /dev/null +++ b/fedot_ind/core/metrics/interval_metrics.py @@ -0,0 +1,138 @@ +from sklearn.metrics import confusion_matrix +import numpy as np +import pandas as pd +from fedot.core.data.data import InputData, OutputData +from typing import Tuple, List, Optional, Union, Literal + +def conf_matrix(actual, predicted): + cm = confusion_matrix(actual, predicted) + return dict(TN=cm[0, 0], FP=cm[0, 1], FN=cm[1, 0], TP=[1, 1]) + +def average_delay(boundaries, prediction, + point, + use_idx=True, + window_placement='lefter'): + cp_confusion = extract_cp_cm(boundaries, prediction, use_idx=use_idx, use_switch_point=False) + # statistics + statistics = { + 'anomalies_num': len(cp_confusion['TPs']) + len(cp_confusion['FPs']), + 'FP_num': len(cp_confusion['FPs']), + 'missed': len(cp_confusion['FNs']) + } + time_func = { + 'righter': lambda triplet: triplet[1] - triplet[0], + 'lefter': lambda triplet: triplet[2] - triplet[1], + 'central': lambda triplet: triplet[1] - triplet[0] - (triplet[2] - triplet[0]) / 2 + }[window_placement] + + detection_history = { + i: time_func(triplet) for i, triplet in cp_confusion['TPs'].items() + } + 
return detection_history, statistics + +def tp_transform(tps): + return np.diff(tps[[1, 0]], axis=0) / np.diff(tps[[-1, 0]], axis=0) + +def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], + prediction: pd.DataFrame, + use_switch_point: bool = True, # if first anomaly dot is considered as changepoint + use_idx: bool = False): + if isinstance(boundaries, pd.DataFrame): + boundaries = boundaries.values.T + anomaly_tsp = prediction[prediction == 1].sort_index().index + TPs, FNs, FPs = {}, [], [] + + if boundaries.shape[1]: + + FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest + for i, (b_low, b_up) in enumerate(boundaries): + all_tsp_in_window = prediction[b_low: b_up].index + anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp + if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? + FNs.append(i if use_idx else all_tsp_in_window) + TPs[i] = [b_low, + anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, + b_up] + if not use_idx: + FNs.append(all_tsp_in_window - anomaly_tsp_in_window) + FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest + else: + FPs.append(anomaly_tsp) + + FPs = np.concatenate(FPs) + FNs = np.concatenate(FNs) + + return dict( + FP=FPs, + FN=FNs, + TP=np.stack(TPs) + ) + +# cognate of single_detecting_boundaries +def get_boundaries(idx, actual_timestamps, window_size:int = None, + window_placement: Literal['left', 'right', 'central'] = 'left', + intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', + ): + # idx = idx + # cast everything to pandas object fir the subsequent comfort + if isinstance(idx, np.array): + if idx.dtype == np.dtype('O'): + idx = pd.to_datetime(pd.Series(idx)) + td = pd.Timedelta(window_size) + else: + idx = pd.Series(idx) + td = window_size + else: + raise TypeError('Unexpected type of ts index') + + boundaries = np.tile(actual_timestamps, (2, 1)) + # [0, 
...] - lower bound, [1, ...] - upper + if window_placement == 'left': + boundaries[0] -= td + elif window_placement == 'central': + boundaries[0] -= td / 2 + boundaries[1] += td / 2 + elif window_placement == 'right': + boundaries[1] += td + else: + raise ValueError('Unknown mode') + + if not len(actual_timestamps): + return boundaries + + # intersection resolution + for i in range(len(actual_timestamps) - 1): + if not boundaries[0, i + 1] > boundaries[1, i]: + continue + + if intersection_mode == 'shift_to_left': + boundaries[0, i + 1] = boundaries[1, i] + elif intersection_mode == 'shift_to_right': + boundaries[1, i] = boundaries[0, i + 1] + elif intersection_mode == 'uniform': + boundaries[1, i], boundaries[0, i + 1] = boundaries[0, i + 1], boundaries[1, i] + else: + raise ValueError('Unknown intersection resolution') + + # filtering + idx_to_keep = np.abs(np.diff(boundaries, axis=0)) > 1e-6 + boundaries = boundaries[..., idx_to_keep] + boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) + return boundaries + +def nab(boundaries, predictions, mode='standard', custom_coefs=None): + inner_coefs = { + 'low_FP': [1.0, -0.11, -1.0], + 'standard': [1., -0.22, -1.], + 'lof_FN': [1., -0.11, -2.] 
+ } + coefs = custom_coefs or inner_coefs[mode] + confusion_matrix = extract_cp_cm(boundaries, predictions) + + tps = confusion_matrix['tps'] + + score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], + coefs) + return score + + diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index e69de29bb..66dc88745 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -0,0 +1,123 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters + + +class TEASER(ModelImplementation): + def __init__(self, params: Optional[OperationParameters] = None): + super().__init__() + if params is None: + params = {} + self.interval_length = params.get('interval_length', 10) # rewrite as interval_length + self.acceptance_threshold = params.get('acceptance_threshold', 5) + self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) + assert self.acceptance_threshold < self.interval_length, 'Not enough checkpoints for prediction proof' + # how to pass into ? % what needed + self.oc_svm_params = {} + self.weasel_params = {} + self.random_state = None # is needed? 
+ + def _init_model(self, max_data_length): + self.prediction_idx = self._compute_prediction_points(max_data_length) + self.n_pred = len(self.prediction_idx) + self.oc_estimators = [OneClassSVM(**self.oc_svm_params) for _ in range(self.n_pred)] + self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] + self.scalers = [StandardScaler() for _ in range(self.n_pred)] # do we need them separate? no inverse path expected + + def fit(self, input_data: InputData): + input_data = self.__convert_pd(input_data) + X, y = input_data.features, input_data.target # what's passed in case of classification to training? + self._init_model(max_data_length=X.shape[-1]) + for i in range(self.n_pred): + self._fit_one_interval(X, y, i) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i]] # what's dimensionality of input? will it work in case of multivariate? + X_part = self.scalers[i].fit_transform(X_part) + probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + filtered_probas = self._filter_positive(probas, y) # + X_oc = self._form_X_oc(filtered_probas) + self.oc_estimators[i].fit(X_oc, y) + + def _predict_one_slave(self, X, i): + X_part = X[..., :self.prediction_idx[i]] + X_part = self.scalers[i].transform(X_part) + probas = self.slave_estimators[i].predict_proba(X_part) + X_oc = self._form_X_oc(probas) + return X_oc, np.argmax(probas, axis=-1) + + def _compute_prediction_points(self, n_idx): + """Computes indices for prediction, includes last index, first interval may be greater""" + prediction_idx = np.arange(n_idx - 1, -1, -self.interval_length)[::-1] + self.earliness = 1 - prediction_idx / n_idx + return prediction_idx + + def _filter_positive(self, predicted_probas, y): # different logic in sktime + predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() + return predicted_probas[predicted_labels == y] + + def _form_X_oc(self, 
predicted_probas): + d = (predicted_probas.max() - predicted_probas) + d[d == 0] = 1 + d = d.min(axis=-1).reshape(-1, 1) + return np.hstack([predicted_probas, d]) + + def _predict(self, X): + n = X.shape[0] + self.states = np.ones((n, self.n_pred, 2)) # num_consec, class + X_ocs, predicted_labels = zip( + *[self._predict_one_slave(X, i) for i in range(self.n_pred)] + ) + non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold + to_oc_check = np.argwhere(non_acceptance) + X_ocs = np.stack(X_ocs) + predicted_labels = np.stack(predicted_labels) + # for each point of estimation + for i in range(self.n_pred): + # find not accepted points + ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] + X_to_ith = X_ocs[i][ith_point_to_oc] + # if they are not outliers + final_verdict = self.oc_estimators[i].predict(X_to_ith) # 1 for accept -1 for reject + # mark as accepted + non_acceptance[i, np.argwhere(final_verdict == 1).flatten()] = False + predicted_labels[non_acceptance] = -1 + return predicted_labels + + def _consecutive_count(self, predicted_labels: List[np.array]): + n = len(predicted_labels[0]) + consecutive_labels = np.ones((self.n_pred, n)) + for i in range(1, self.n_pred): + equal = predicted_labels[i - 1] == predicted_labels[i] + consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 + return consecutive_labels # n_pred x n_instances + + def __convert_pd(self, input_data): + if hasattr(input_data.features, 'values'): + input_data.features = input_data.features.values + if hasattr(input_data.target, 'values'): + input_data.target = input_data.target.values + return input_data + + def predict(self, input_data: InputData) -> OutputData: + input_data = self.__convert_pd(input_data) + prediction = self._predict(input_data.features) + return self._convert_to_output(input_data, predict=prediction) + + def predict_for_fit(self, input_data: InputData) -> OutputData: + return self.predict(input_data) + + def _score(self, X, y, 
hm_shift_to_acc=None): + hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc + predictions = self._predict(X) + accuracies = (predictions == np.tile(y, (1, self.n_pred))).sum(axis=1) / len(y) + return (1 + hm_shift_to_acc) * accuracies * self.earliness / (hm_shift_to_acc * accuracies + self.earliness) + + def _tune_oc(self): + #TODO + pass From 588846a5c6c3ac76fdd15cc6ee66bd39912cc8f9 Mon Sep 17 00:00:00 2001 From: leostre Date: Wed, 26 Jun 2024 17:09:09 +0300 Subject: [PATCH 19/43] teaser inherits sklearn's classifier mixin now --- fedot_ind/core/models/early_tc/__init__.py | 0 fedot_ind/core/models/early_tc/teaser.py | 61 +++++++++++++------ .../data/default_operation_params.json | 7 ++- .../data/industrial_model_repository.json | 11 ++++ fedot_ind/core/repository/model_repository.py | 5 +- fedot_ind/core/tuning/search_space.py | 24 ++++++++ tests/unit/core/models/test_teaser.py | 35 +++++++++++ 7 files changed, 121 insertions(+), 22 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/__init__.py create mode 100644 tests/unit/core/models/test_teaser.py diff --git a/fedot_ind/core/models/early_tc/__init__.py b/fedot_ind/core/models/early_tc/__init__.py new file mode 100644 index 000000000..e69de29bb diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 66dc88745..66a031fd4 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -3,6 +3,7 @@ from fedot.core.data.data import InputData, OutputData from sklearn.svm import OneClassSVM from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV from sktime.classification.dictionary_based import MUSE, WEASEL from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters @@ -13,21 +14,25 @@ def __init__(self, params: 
Optional[OperationParameters] = None): super().__init__() if params is None: params = {} + self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') self.interval_length = params.get('interval_length', 10) # rewrite as interval_length self.acceptance_threshold = params.get('acceptance_threshold', 5) self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) assert self.acceptance_threshold < self.interval_length, 'Not enough checkpoints for prediction proof' + # how to pass into ? % what needed - self.oc_svm_params = {} + self._oc_svm_params = [100, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1.5, 1] self.weasel_params = {} self.random_state = None # is needed? def _init_model(self, max_data_length): self.prediction_idx = self._compute_prediction_points(max_data_length) self.n_pred = len(self.prediction_idx) - self.oc_estimators = [OneClassSVM(**self.oc_svm_params) for _ in range(self.n_pred)] + self.oc_estimators = [None] * self.n_pred self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] - self.scalers = [StandardScaler() for _ in range(self.n_pred)] # do we need them separate? no inverse path expected + self.scalers = [StandardScaler() for _ in range(self.n_pred)] + self.__offset = max_data_length % self.interval_length + self.best_estimator_idx = -1 def fit(self, input_data: InputData): input_data = self.__convert_pd(input_data) @@ -35,17 +40,22 @@ def fit(self, input_data: InputData): self._init_model(max_data_length=X.shape[-1]) for i in range(self.n_pred): self._fit_one_interval(X, y, i) + self.best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i]] # what's dimensionality of input? will it work in case of multivariate? + X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
X_part = self.scalers[i].fit_transform(X_part) probas = self.slave_estimators[i].fit_predict_proba(X_part, y) - filtered_probas = self._filter_positive(probas, y) # + filtered_probas = self._filter_trues(probas, y) # X_oc = self._form_X_oc(filtered_probas) - self.oc_estimators[i].fit(X_oc, y) + self.oc_estimators[i] = GridSearchCV(OneClassSVM(), + param_grid={"gamma": self._oc_svm_params}, + scoring='accuracy', + cv=min(X.shape[0], 10) + ).fit(X_oc, np.ones((len(X_oc), 1))).best_estimator_ - def _predict_one_slave(self, X, i): - X_part = X[..., :self.prediction_idx[i]] + def _predict_one_slave(self, X, i, offset=0): + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] X_part = self.scalers[i].transform(X_part) probas = self.slave_estimators[i].predict_proba(X_part) X_oc = self._form_X_oc(probas) @@ -57,7 +67,7 @@ def _compute_prediction_points(self, n_idx): self.earliness = 1 - prediction_idx / n_idx return prediction_idx - def _filter_positive(self, predicted_probas, y): # different logic in sktime + def _filter_trues(self, predicted_probas, y): # different logic in sktime predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() return predicted_probas[predicted_labels == y] @@ -70,15 +80,20 @@ def _form_X_oc(self, predicted_probas): def _predict(self, X): n = X.shape[0] self.states = np.ones((n, self.n_pred, 2)) # num_consec, class + if self.prediction_mode == 'best_by_harmonic_mean': + estimator_indices = [self.best_estimator_idx] + else: + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = list(range(last_idx + 1)) X_ocs, predicted_labels = zip( - *[self._predict_one_slave(X, i) for i in range(self.n_pred)] + *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold to_oc_check = np.argwhere(non_acceptance) X_ocs = np.stack(X_ocs) predicted_labels = np.stack(predicted_labels) # for each point 
of estimation - for i in range(self.n_pred): + for i in range(predicted_labels.shape[0]): # find not accepted points ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] X_to_ith = X_ocs[i][ith_point_to_oc] @@ -87,15 +102,16 @@ def _predict(self, X): # mark as accepted non_acceptance[i, np.argwhere(final_verdict == 1).flatten()] = False predicted_labels[non_acceptance] = -1 - return predicted_labels + return predicted_labels # prediction_points x n_instances def _consecutive_count(self, predicted_labels: List[np.array]): n = len(predicted_labels[0]) - consecutive_labels = np.ones((self.n_pred, n)) - for i in range(1, self.n_pred): + prediction_points = len(predicted_labels) + consecutive_labels = np.ones((prediction_points, n)) + for i in range(1, prediction_points): equal = predicted_labels[i - 1] == predicted_labels[i] consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 - return consecutive_labels # n_pred x n_instances + return consecutive_labels # prediction_points x n_instances def __convert_pd(self, input_data): if hasattr(input_data.features, 'values'): @@ -115,9 +131,14 @@ def predict_for_fit(self, input_data: InputData) -> OutputData: def _score(self, X, y, hm_shift_to_acc=None): hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc predictions = self._predict(X) - accuracies = (predictions == np.tile(y, (1, self.n_pred))).sum(axis=1) / len(y) - return (1 + hm_shift_to_acc) * accuracies * self.earliness / (hm_shift_to_acc * accuracies + self.earliness) + prediction_points = predictions.shape[0] + accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) + return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) - def _tune_oc(self): - #TODO - pass + def _get_applicable_index(self, last_available_idx): + idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') + if idx == 0: + raise 
RuntimeError('Too few points for prediction!') + idx -= 1 + offset = last_available_idx - self.prediction_idx[idx] + return idx, offset diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index 2ac985979..3f3cfbfe5 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -124,6 +124,11 @@ "min_samples_leaf": 10, "bootstrap": false }, + "teaser": { + "interval_length": 10, + "acceptance_threshold": 3, + "hm_shift_to_acc": 2 + }, "dt": { "max_depth": 5, "min_samples_split": 10, @@ -438,4 +443,4 @@ "kernel": "rbf", "gamma": "auto" } -} \ No newline at end of file +} diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index c4a87aefb..78674cfba 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -729,6 +729,17 @@ "non_linear" ] }, + "teaser": { + "meta": "ts_model", + "presets": ["fast_train", "ts"], + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.ts]" + }, "xgboost": { "meta": "sklearn_class", "presets": ["*tree"], diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index ab73b3c85..da4ae22e3 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -45,6 +45,7 @@ from fedot_ind.core.models.detection.custom.stat_detector import StatisticalDetector from fedot_ind.core.models.detection.probalistic.kalman import UnscentedKalmanFilter from fedot_ind.core.models.detection.subspaces.sst import SingularSpectrumTransformation +from fedot_ind.core.models.early_tc.teaser import TEASER from fedot_ind.core.models.manifold.riemann_embeding import 
RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR @@ -88,7 +89,9 @@ class AtomizedModel(Enum): # external models 'lgbm': LGBMClassifier, # for detection - 'one_class_svm': OneClassSVM + 'one_class_svm': OneClassSVM, + # Early classification + 'teaser': TEASER } FEDOT_PREPROC_MODEL = { # data standartization diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 9d1f6c858..4cff3aa96 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -65,6 +65,30 @@ 'selection_strategy': {'hyperopt-dist': hp.choice, 'sampling-scope': [['sum', 'pairwise']]} }, + 'teaser': + {'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'acceptance_threshold': {'hyperopt-dist': hp.choice, + 'sampling_scope': [[1, 2, 3, 4, 5]]}, + 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, + 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + }, + 'deepar_model': + {'epochs': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[x for x in range(10, 100, 10)]]}, + 'batch_size': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[x for x in range(8, 64, 6)]]}, + 'dropout': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(0, 0.6, 0.1))]}, + 'rnn_layers':{'hyperopt-dist': hp.choice, + 'sampling-scope': [range(1, 6)]}, + 'hidden_size':{'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(10, 101, 10))]}, + 'cell_type':{'hyperopt-dist': hp.choice, + 'sampling-scope': [['GRU', 'LSTM', 'RNN']]}, + 'expected_distribution': {'hyperopt-dist': hp.choice, + 'sampling-scope': [['normal', 'cauchy']]} + }, 'patch_tst_model': {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(10, 100, 10)]]}, 'batch_size': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(8, 64, 6)]]}, diff --git 
a/tests/unit/core/models/test_teaser.py b/tests/unit/core/models/test_teaser.py new file mode 100644 index 000000000..2bc19b8de --- /dev/null +++ b/tests/unit/core/models/test_teaser.py @@ -0,0 +1,35 @@ +import pytest +import numpy as np +from fedot_ind.core.models.early_tc import teaser as TEASER + + +@pytest.fixture(scope='module') +def teaser(): + teaser = TEASER.TEASER({'interval_length': 10, 'prediction_mode': ''}) + return teaser + +@pytest.fixture(scope='module') +def xy(): + return np.random.randn((2, 23)), np.random.randint(0, 2, size=(2, 1)) + +def test_get_applicable_index(teaser): + teaser._init_model(23) + idx, offset = teaser._get_last_applicable_idx(100) + assert offset == 100 - 22, 'Wrong offset estimation when right edge' + assert idx == len(teaser.prediction_idx) - 1 + idx, offset = teaser._get_last_applicable_idx(12) + assert offset == 100 - teaser.prediction_idx[idx], 'Wrong offset estimation in the middle' + assert idx == len(teaser.prediction_idx) - 1 + +def test_compute_prediction_points(teaser): + indices = teaser._compute_prediction_points(23) + assert 2 in indices + assert 22 in indices + assert 23 not in indices + +# def test_consecutive_count(teaser): +# pass + +# def test_score(teaser): + + From d939a340d1e6dead45344749dcbf43d6af2a49bc Mon Sep 17 00:00:00 2001 From: leostre Date: Thu, 27 Jun 2024 18:22:34 +0300 Subject: [PATCH 20/43] class tree reconf. 
added proba_thresholding classifier (not registered) --- .../core/models/early_tc/base_early_tc.py | 117 +++++++++++++++++ .../core/models/early_tc/prob_threshold.py | 46 +++++++ fedot_ind/core/models/early_tc/teaser.py | 123 +++++------------- 3 files changed, 194 insertions(+), 92 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/base_early_tc.py create mode 100644 fedot_ind/core/models/early_tc/prob_threshold.py diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py new file mode 100644 index 000000000..f97ba0593 --- /dev/null +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -0,0 +1,117 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum + + +class BaseETC(ClassifierMixin, BaseEstimator): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') + self.interval_percentage = params.get('interval_percentage', 10) + self.consecutive_predictions = params.get('consecutive_predictions', 3) + self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) 
+ self.random_state = params.get('random_state', None) + self.weasel_params = {} + assert self.consecutive_predictions < self.interval_percentage, 'Not enough checkpoints for prediction proof' + + def _init_model(self, X, y): + max_data_length = X.shape[-1] + self.prediction_idx = self._compute_prediction_points(max_data_length) + self.n_pred = len(self.prediction_idx) + self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] + self.scalers = [StandardScaler() for _ in range(self.n_pred)] + self._best_estimator_idx = -1 + self.classes_ = [np.unique(y)] + + @property + def required_length(self): + if not hasattr(self, '_best_estimator_idx'): + return None + return self.prediction_idx[self._best_estimator_idx] + + def fit(self, X, y=None): + assert y is not None, 'Pass y' + y = np.array(y).flatten() + self._init_model(X, y) + for i in range(self.n_pred): + self._fit_one_interval(X, y, i) + self._best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
+ X_part = self.scalers[i].fit_transform(X_part) + probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + return probas + + def _predict_one_slave(self, X, i, offset=0): + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] + X_part = self.scalers[i].transform(X_part) + probas = self.slave_estimators[i].predict_proba(X_part) + return probas, np.argmax(probas, axis=-1) + + def _compute_prediction_points(self, n_idx): + interval_length = int(n_idx * self.interval_percentage / 100) + prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1] + self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + return prediction_idx + + def _select_estimators(self, X): + offset = 0 + if self.prediction_mode == 'best_by_harmonic_mean': + estimator_indices = [self._best_estimator_idx] + elif self.prediction_mode == 'all': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = np.arange(last_idx + 1) + else: + raise ValueError('Unknown prediction mode') + return estimator_indices, offset + + def _predict(self, X,): + estimator_indices, offset = self._select_estimators(X) + predicted_probas, predicted_labels = zip( + *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary + ) + return predicted_labels, predicted_probas + + def _consecutive_count(self, predicted_labels: List[np.array]): + n = len(predicted_labels[0]) + prediction_points = len(predicted_labels) + consecutive_labels = np.ones((prediction_points, n)) + for i in range(1, prediction_points): + equal = predicted_labels[i - 1] == predicted_labels[i] + consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 + return consecutive_labels # prediction_points x n_instances + + def predict_proba(self, X): + raise NotImplementedError + + def predict(self, X): + raise NotImplementedError + + def _score(self, X, y, hm_shift_to_acc=None): + y = np.array(y).flatten() + hm_shift_to_acc = 
hm_shift_to_acc or self.hm_shift_to_acc + predictions, *_ = self._predict(X) + prediction_points = predictions.shape[0] + accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) + return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) + + def _get_applicable_index(self, last_available_idx): + idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') + if idx == 0: + raise RuntimeError('Too few points for prediction!') + idx -= 1 + offset = last_available_idx - self.prediction_idx[idx] + return idx, offset diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py new file mode 100644 index 000000000..0433de34a --- /dev/null +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -0,0 +1,46 @@ +from typing import Union, List, Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data +from fedot.core.data.data import InputData, OutputData +from sklearn.svm import OneClassSVM +from sklearn.preprocessing import StandardScaler +from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator +from sktime.classification.dictionary_based import MUSE, WEASEL +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC + +class ProbabilityThresholdClassifier(BaseETC): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + 
self.probability_threshold = params.get('probability_threshold', None) + + def _init_model(self, X, y): + super()._init_model(X, y) + if self.probability_threshold is None: + self.probability_threshold = 1 / len(self.classes_[0]) + + def predict_proba(self, X): + _, predicted_probas, non_acceptance = self._predict(X) + predicted_probas[non_acceptance] = 0 + return predicted_probas.squeeze() + + def predict(self, X): + predicted_labels, _, non_acceptance = self._predict(X) + predicted_labels[non_acceptance] = -1 + # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] + return predicted_labels # prediction_points x n_instances + + def _predict(self, X): + predicted_labels, predicted_probas = super()._predict(X) + predicted_probas = np.stack(predicted_probas) + predicted_labels = np.stack(predicted_labels) + non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions + double_check = predicted_probas.max(axis=-1) > self.probability_threshold + non_acceptance[non_acceptance & double_check] = False + return predicted_labels, predicted_probas, non_acceptance diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 66a031fd4..2809824c8 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,51 +1,30 @@ from typing import Union, List, Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data from fedot.core.data.data import InputData, OutputData from sklearn.svm import OneClassSVM from sklearn.preprocessing import StandardScaler from sklearn.model_selection import GridSearchCV +from sklearn.base import ClassifierMixin, BaseEstimator from sktime.classification.dictionary_based import MUSE, WEASEL from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from 
fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC -class TEASER(ModelImplementation): +class TEASER(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): - super().__init__() - if params is None: - params = {} - self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') - self.interval_length = params.get('interval_length', 10) # rewrite as interval_length - self.acceptance_threshold = params.get('acceptance_threshold', 5) - self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) - assert self.acceptance_threshold < self.interval_length, 'Not enough checkpoints for prediction proof' + super().__init__(params) + self._oc_svm_params = (100., 10., 5., 2.5, 1.5, 1., 0.5, 0.25, 0.1) - # how to pass into ? % what needed - self._oc_svm_params = [100, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1.5, 1] - self.weasel_params = {} - self.random_state = None # is needed? - - def _init_model(self, max_data_length): - self.prediction_idx = self._compute_prediction_points(max_data_length) - self.n_pred = len(self.prediction_idx) + def _init_model(self, X, y): + super()._init_model(X, y) self.oc_estimators = [None] * self.n_pred - self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] - self.scalers = [StandardScaler() for _ in range(self.n_pred)] - self.__offset = max_data_length % self.interval_length - self.best_estimator_idx = -1 - - def fit(self, input_data: InputData): - input_data = self.__convert_pd(input_data) - X, y = input_data.features, input_data.target # what's passed in case of classification to training? 
- self._init_model(max_data_length=X.shape[-1]) - for i in range(self.n_pred): - self._fit_one_interval(X, y, i) - self.best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? - X_part = self.scalers[i].fit_transform(X_part) - probas = self.slave_estimators[i].fit_predict_proba(X_part, y) + probas = super()._fit_one_interval(X, y, i) filtered_probas = self._filter_trues(probas, y) # X_oc = self._form_X_oc(filtered_probas) self.oc_estimators[i] = GridSearchCV(OneClassSVM(), @@ -55,17 +34,9 @@ def _fit_one_interval(self, X, y, i): ).fit(X_oc, np.ones((len(X_oc), 1))).best_estimator_ def _predict_one_slave(self, X, i, offset=0): - X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] - X_part = self.scalers[i].transform(X_part) - probas = self.slave_estimators[i].predict_proba(X_part) + probas, labels = super()._predict_one_slave(X, i, offset) X_oc = self._form_X_oc(probas) - return X_oc, np.argmax(probas, axis=-1) - - def _compute_prediction_points(self, n_idx): - """Computes indices for prediction, includes last index, first interval may be greater""" - prediction_idx = np.arange(n_idx - 1, -1, -self.interval_length)[::-1] - self.earliness = 1 - prediction_idx / n_idx - return prediction_idx + return X_oc, probas, labels def _filter_trues(self, predicted_probas, y): # different logic in sktime predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() @@ -78,67 +49,35 @@ def _form_X_oc(self, predicted_probas): return np.hstack([predicted_probas, d]) def _predict(self, X): - n = X.shape[0] - self.states = np.ones((n, self.n_pred, 2)) # num_consec, class - if self.prediction_mode == 'best_by_harmonic_mean': - estimator_indices = [self.best_estimator_idx] - else: - last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) - estimator_indices = list(range(last_idx + 1)) - X_ocs, 
predicted_labels = zip( + estimator_indices, offset = self._select_estimators(X) + X_ocs, predicted_probas, predicted_labels = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) - non_acceptance = self._consecutive_count(predicted_labels) < self.acceptance_threshold + non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions to_oc_check = np.argwhere(non_acceptance) X_ocs = np.stack(X_ocs) + predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) + final_verdicts = np.zeros((len(estimator_indices), X.shape[0])) # for each point of estimation for i in range(predicted_labels.shape[0]): # find not accepted points ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] X_to_ith = X_ocs[i][ith_point_to_oc] # if they are not outliers - final_verdict = self.oc_estimators[i].predict(X_to_ith) # 1 for accept -1 for reject + final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # 1 for accept -1 for reject # mark as accepted - non_acceptance[i, np.argwhere(final_verdict == 1).flatten()] = False + non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False + final_verdicts[i] = final_verdict + return predicted_labels, predicted_probas, non_acceptance, final_verdicts + + def predict_proba(self, X): + _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) + predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] + return predicted_probas.squeeze() + + def predict(self, X): + predicted_labels, _, non_acceptance, final_verdicts = self._predict(X) predicted_labels[non_acceptance] = -1 + # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances - - def _consecutive_count(self, predicted_labels: List[np.array]): - n = len(predicted_labels[0]) - prediction_points = len(predicted_labels) - consecutive_labels = np.ones((prediction_points, 
n)) - for i in range(1, prediction_points): - equal = predicted_labels[i - 1] == predicted_labels[i] - consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 - return consecutive_labels # prediction_points x n_instances - - def __convert_pd(self, input_data): - if hasattr(input_data.features, 'values'): - input_data.features = input_data.features.values - if hasattr(input_data.target, 'values'): - input_data.target = input_data.target.values - return input_data - - def predict(self, input_data: InputData) -> OutputData: - input_data = self.__convert_pd(input_data) - prediction = self._predict(input_data.features) - return self._convert_to_output(input_data, predict=prediction) - - def predict_for_fit(self, input_data: InputData) -> OutputData: - return self.predict(input_data) - - def _score(self, X, y, hm_shift_to_acc=None): - hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc - predictions = self._predict(X) - prediction_points = predictions.shape[0] - accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) - return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) - - def _get_applicable_index(self, last_available_idx): - idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') - if idx == 0: - raise RuntimeError('Too few points for prediction!') - idx -= 1 - offset = last_available_idx - self.prediction_idx[idx] - return idx, offset From 4d3e57dd0efee6add236d1ae68dd107feee52f83 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 28 Jun 2024 14:11:17 +0300 Subject: [PATCH 21/43] both etc models are registered, available via api --- fedot_ind/core/models/early_tc/base_early_tc.py | 11 ++--------- .../core/models/early_tc/prob_threshold.py | 12 +----------- fedot_ind/core/models/early_tc/teaser.py | 10 +--------- .../data/default_operation_params.json | 9 +++++++-- .../data/industrial_model_repository.json 
| 17 +++++++++++++---- fedot_ind/core/repository/model_repository.py | 4 +++- fedot_ind/core/tuning/search_space.py | 12 ++++++++++-- 7 files changed, 37 insertions(+), 38 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index f97ba0593..c7b84bedf 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -1,16 +1,9 @@ -from typing import Union, List, Optional +from typing import Optional, List from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data -from fedot.core.data.data import InputData, OutputData -from sklearn.svm import OneClassSVM from sklearn.preprocessing import StandardScaler -from sklearn.model_selection import GridSearchCV from sklearn.base import ClassifierMixin, BaseEstimator -from sktime.classification.dictionary_based import MUSE, WEASEL -from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from sktime.classification.dictionary_based import WEASEL from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot.core.repository.tasks import Task, TaskTypesEnum class BaseETC(ClassifierMixin, BaseEstimator): diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 0433de34a..343077cbe 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -1,16 +1,6 @@ -from typing import Union, List, Optional +from typing import Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data -from fedot.core.data.data import InputData, 
OutputData -from sklearn.svm import OneClassSVM -from sklearn.preprocessing import StandardScaler -from sklearn.model_selection import GridSearchCV -from sklearn.base import ClassifierMixin, BaseEstimator -from sktime.classification.dictionary_based import MUSE, WEASEL -from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot.core.repository.tasks import Task, TaskTypesEnum from fedot_ind.core.models.early_tc.base_early_tc import BaseETC class ProbabilityThresholdClassifier(BaseETC): diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 2809824c8..f5d2590b3 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,16 +1,8 @@ -from typing import Union, List, Optional +from typing import Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_input_data -from fedot.core.data.data import InputData, OutputData from sklearn.svm import OneClassSVM -from sklearn.preprocessing import StandardScaler from sklearn.model_selection import GridSearchCV -from sklearn.base import ClassifierMixin, BaseEstimator -from sktime.classification.dictionary_based import MUSE, WEASEL -from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot.core.repository.tasks import Task, TaskTypesEnum from fedot_ind.core.models.early_tc.base_early_tc import BaseETC diff --git a/fedot_ind/core/repository/data/default_operation_params.json 
b/fedot_ind/core/repository/data/default_operation_params.json index 3f3cfbfe5..11980e4b4 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -125,8 +125,13 @@ "bootstrap": false }, "teaser": { - "interval_length": 10, - "acceptance_threshold": 3, + "interval_percentage": 10, + "consecutive_predictions": 3, + "hm_shift_to_acc": 2 + }, + "proba_threshold_etc": { + "interval_percentage": 10, + "consecutive_predictions": 3, "hm_shift_to_acc": 2 }, "dt": { diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 78674cfba..ccbd1e0a7 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -623,7 +623,7 @@ }, "ridge": { "meta": "sklearn_regr", - "presets": ["fast_train", "ts"], + "presets": ["fast_train"], "tags": [ "simple", "linear", @@ -730,15 +730,24 @@ ] }, "teaser": { - "meta": "ts_model", - "presets": ["fast_train", "ts"], + "meta": "sklearn_class", "tags": [ "simple", "interpretable", "non_lagged", "non_linear" ], - "input_type": "[DataTypesEnum.ts]" + "input_type": "[DataTypesEnum.table]" + }, + "proba_threshold_etc": { + "meta": "sklearn_class", + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" }, "xgboost": { "meta": "sklearn_class", diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index da4ae22e3..ac23c4f22 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -46,6 +46,7 @@ from fedot_ind.core.models.detection.probalistic.kalman import UnscentedKalmanFilter from fedot_ind.core.models.detection.subspaces.sst import SingularSpectrumTransformation from fedot_ind.core.models.early_tc.teaser import TEASER 
+from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier from fedot_ind.core.models.manifold.riemann_embeding import RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR @@ -91,7 +92,8 @@ class AtomizedModel(Enum): # for detection 'one_class_svm': OneClassSVM, # Early classification - 'teaser': TEASER + 'teaser': TEASER, + 'proba_threshold_etc': ProbabilityThresholdClassifier } FEDOT_PREPROC_MODEL = { # data standartization diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 4cff3aa96..994db4e51 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -73,15 +73,23 @@ 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, }, + 'proba_threshold_etc': + {'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'acceptance_threshold': {'hyperopt-dist': hp.choice, + 'sampling_scope': [[1, 2, 3, 4, 5]]}, + 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, + 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + }, 'deepar_model': {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(10, 100, 10)]]}, 'batch_size': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(8, 64, 6)]]}, 'dropout': {'hyperopt-dist': hp.choice, - 'sampling-scope': [list(range(0, 0.6, 0.1))]}, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5]]}, 'rnn_layers':{'hyperopt-dist': hp.choice, - 'sampling-scope': [range(1, 6)]}, + 'sampling-scope': [list(range(1, 6))]}, 'hidden_size':{'hyperopt-dist': hp.choice, 'sampling-scope': [list(range(10, 101, 10))]}, 'cell_type':{'hyperopt-dist': hp.choice, From 4da7c13cb5b778b435c532111480426e137af223 Mon Sep 17 00:00:00 2001 From: leostre Date: Tue, 2 Jul 2024 15:27:34 +0300 Subject: [PATCH 22/43] ecec added --- 
.../core/models/early_tc/base_early_tc.py | 22 ++++--- fedot_ind/core/models/early_tc/ecec.py | 62 +++++++++++++++++++ .../core/models/early_tc/prob_threshold.py | 7 ++- fedot_ind/core/models/early_tc/teaser.py | 9 +++ 4 files changed, 88 insertions(+), 12 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/ecec.py diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index c7b84bedf..5da8e61bd 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -33,6 +33,10 @@ def required_length(self): if not hasattr(self, '_best_estimator_idx'): return None return self.prediction_idx[self._best_estimator_idx] + + @property + def n_classes(self): + return len(self.classes_[0]) def fit(self, X, y=None): assert y is not None, 'Pass y' @@ -40,7 +44,6 @@ def fit(self, X, y=None): self._init_model(X, y) for i in range(self.n_pred): self._fit_one_interval(X, y, i) - self._best_estimator_idx = np.argmax(self._score(X, y, self.hm_shift_to_acc)) def _fit_one_interval(self, X, y, i): X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
@@ -60,23 +63,23 @@ def _compute_prediction_points(self, n_idx): self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 return prediction_idx - def _select_estimators(self, X): + def _select_estimators(self, X, training=False): offset = 0 - if self.prediction_mode == 'best_by_harmonic_mean': + if not training and self.prediction_mode == 'best_by_harmonic_mean': estimator_indices = [self._best_estimator_idx] - elif self.prediction_mode == 'all': + elif training or self.prediction_mode == 'all': last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) estimator_indices = np.arange(last_idx + 1) else: raise ValueError('Unknown prediction mode') return estimator_indices, offset - def _predict(self, X,): - estimator_indices, offset = self._select_estimators(X) - predicted_probas, predicted_labels = zip( + def _predict(self, X, training=True): + estimator_indices, offset = self._select_estimators(X, training) + prediction = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) - return predicted_labels, predicted_probas + return prediction # see the output in _predict_one_slave def _consecutive_count(self, predicted_labels: List[np.array]): n = len(predicted_labels[0]) @@ -96,11 +99,12 @@ def predict(self, X): def _score(self, X, y, hm_shift_to_acc=None): y = np.array(y).flatten() hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc - predictions, *_ = self._predict(X) + predictions = self._predict(X)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) + def _get_applicable_index(self, last_available_idx): idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') if idx == 0: diff --git a/fedot_ind/core/models/early_tc/ecec.py 
b/fedot_ind/core/models/early_tc/ecec.py new file mode 100644 index 000000000..a00df631d --- /dev/null +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -0,0 +1,62 @@ +from typing import Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from sklearn.model_selection import cross_val_predict +from sklearn.base import clone +from sklearn.metrics import confusion_matrix + +class ECEC(BaseETC): + def __init__(self, params: Optional[OperationParameters] = None): + super().__init__(params) + + def _init_model(self, X, y): + super()._init_model(X, y) + self._confidences = np.ones((X.shape[0], self.n_pred)) + + def _score(self, X, y, alpha): + y = y.astype(int) + predicted_labels = np.stack(super()._predict(X)[0]).astype(int) # n_pred x n_inst + n = predicted_labels.shape[0] + accuracies = (predicted_labels == np.tile(y, (1, n))) # n_pred x n_inst + confidences = np.ones((n, X.shape[0]), dtype='float32') + for i in range(n): + y_pred = predicted_labels[i] + reliability_i = confusion_matrix(y, y_pred, normalize='pred') + confidences[i] = 1 - reliability_i[y, y_pred] # n_inst + confidences = 1 - np.cumprod(confidences, axis=0) # n_pred x n_inst + candidates = self._select_thrs(confidences) # n_candidates + cfs = np.zeros_like(candidates) + for i, candidate in enumerate(candidates): + mask = confidences >= candidate # n_pred x n_inst + accuracy_for_candidate = (accuracies * mask).sum(1) / mask.sum(1) # n_pred + cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) + return candidates[np.argmin(cfs)] + + @staticmethod + def _select_thrs(confidences): + C = np.unique(confidences.round(3)) + difference = np.diff(C) + pair_means = C[:-1] + difference / 2 + difference_shifted = np.roll(difference, 1) + difference_idx = np.argwhere(difference > difference_shifted) + return 
pair_means[difference_idx].flatten() + + @staticmethod + def cost_func(earliness, accuracies, alpha): + return alpha * accuracies + (1 - alpha) * earliness + + def fit(self, X, y): + self.confidence_threshold = super().fit(X, y) + + + + + + + + + + + + diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 343077cbe..f6c9ab65d 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -21,15 +21,16 @@ def predict_proba(self, X): return predicted_probas.squeeze() def predict(self, X): - predicted_labels, _, non_acceptance = self._predict(X) + predicted_labels, _, non_acceptance = self._predict(X, training=False) predicted_labels[non_acceptance] = -1 # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances - def _predict(self, X): - predicted_labels, predicted_probas = super()._predict(X) + def _predict(self, X, training=True): + predicted_probas, predicted_labels = super()._predict(X, training) predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) + # print(predicted_labels.shape, predicted_probas.shape) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions double_check = predicted_probas.max(axis=-1) > self.probability_threshold non_acceptance[non_acceptance & double_check] = False diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index f5d2590b3..ff58cf72d 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -73,3 +73,12 @@ def predict(self, X): predicted_labels[non_acceptance] = -1 # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances + + def _score(self, X, y, hm_shift_to_acc=None): + scores = super()._score(X, y, hm_shift_to_acc) + 
self._best_estimator_idx = np.argmax(scores) + return scores + + def fit(self, X, y): + super().fit(X, y) + return self._score(X, y, self.hm_shift_to_acc) From d11fa8d2bb776f110b98719b991c53cd2542701e Mon Sep 17 00:00:00 2001 From: leostre Date: Thu, 4 Jul 2024 18:23:13 +0300 Subject: [PATCH 23/43] economy_k added --- .../core/models/early_tc/base_early_tc.py | 9 +- fedot_ind/core/models/early_tc/economy_k.py | 89 +++++++++++++++++++ .../core/models/early_tc/prob_threshold.py | 10 +++ fedot_ind/core/models/early_tc/teaser.py | 6 +- 4 files changed, 107 insertions(+), 7 deletions(-) create mode 100644 fedot_ind/core/models/early_tc/economy_k.py diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 5da8e61bd..5e180c2a9 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -14,7 +14,8 @@ def __init__(self, params: Optional[OperationParameters] = None): self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') self.interval_percentage = params.get('interval_percentage', 10) self.consecutive_predictions = params.get('consecutive_predictions', 3) - self.hm_shift_to_acc = params.get('hm_shift_to_acc', 1.) + self.accuracy_importance = params.get('accuracy_importance', 1.) 
+ self.min_ts_length = params.get('min_ts_step', 3) self.random_state = params.get('random_state', None) self.weasel_params = {} assert self.consecutive_predictions < self.interval_percentage, 'Not enough checkpoints for prediction proof' @@ -58,8 +59,8 @@ def _predict_one_slave(self, X, i, offset=0): return probas, np.argmax(probas, axis=-1) def _compute_prediction_points(self, n_idx): - interval_length = int(n_idx * self.interval_percentage / 100) - prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1] + interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) + prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1][1:] self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 return prediction_idx @@ -98,7 +99,7 @@ def predict(self, X): def _score(self, X, y, hm_shift_to_acc=None): y = np.array(y).flatten() - hm_shift_to_acc = hm_shift_to_acc or self.hm_shift_to_acc + hm_shift_to_acc = hm_shift_to_acc or self.accuracy_importance predictions = self._predict(X)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py new file mode 100644 index 000000000..639e680cd --- /dev/null +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -0,0 +1,89 @@ +from typing import Optional +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from sklearn.cluster import KMeans +from sklearn.metrics import confusion_matrix +from sklearn.model_selection import train_test_split, cross_val_predict + +class EconomyK(BaseETC): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__(params) 
+ self.lambda_ = params.get('lambda', 1.) + self._cluster_factor = params.get('cluster_factor' , 1) + self._random_state = 2104 + self.__cv = 5 + + def _init_model(self, X, y): + super()._init_model(X, y) + self.n_clusters = int(self._cluster_factor * self.n_classes) + self._clusterizer = KMeans(self.n_clusters, random_state=self._random_state) + self.state = np.zeros((self.n_pred, self.n_clusters, self.n_classes, self.n_classes)) + + def fit(self, X, y): + y = y.flatten().astype(int) + self._init_model(X, y) + self._pyck_ = confusion_matrix(y, self._clusterizer.fit(X).labels_, normalize='true')[:self.n_classes, :self.n_clusters] + for i in range(self.n_pred): + self._fit_one_interval(X, y, i) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i] + 1] + X_part = self.scalers[i].fit_transform(X_part) + y_pred = cross_val_predict(self.slave_estimators[i], X_part, y, cv=self.__cv) + self.slave_estimators[i].fit(X_part, y) + states_by_i = np.zeros(( self.n_clusters, self.n_classes, self.n_classes)) + np.add.at(states_by_i, (self._clusterizer.labels_, y, y_pred), 1) + states_by_i /= np.mean(states_by_i, -2, keepdims=True) + states_by_i[np.isnan(states_by_i)] = 0 + states_by_i[:, np.eye(self.n_classes).astype(bool)] = 0 + self.state[i] = states_by_i + + def _predict_one_slave(self, X, i, offset=0): + cluster_centers = self._clusterizer.cluster_centers_[:, :self.prediction_idx[i] + 1] # n_clust x len + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] # n_inst x len + X_part = self.scalers[i].transform(X_part) + probas = self.slave_estimators[i].predict_proba(X_part) + optimal_time, is_optimal = self._get_prediction_time(X_part, cluster_centers, i) + return probas, optimal_time, is_optimal + + def __cluster_probas(self, X, centroids): + length = centroids.shape[-1] + diffs = np.subtract.outer(X, centroids).swapaxes(1, 2) + diffs = diffs[..., np.eye(length).astype(bool)] # n_inst x n_clust x len + distances = np.linalg.norm(diffs, 
axis=-1) + delta_k = 1. - distances / distances.mean(axis=-1)[:, None] + s = 1. / (1. + np.exp(-self.lambda_ * delta_k)) + return s / s.sum(axis=-1)[:, None] # n_inst x n_clust + + def __expected_costs(self, X, cluster_centroids, i): + cluster_probas = self.__cluster_probas(X, cluster_centroids) # n_inst x n_clust + s_glob = np.sum(np.transpose( + np.sum(self.state[i:], axis=-1), axes=(0, 2, 1) + ) * self._pyck_[None, ...], axis=1) + costs = cluster_probas @ s_glob.T # n_inst x time_left + costs += self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? + return costs + + def _get_prediction_time(self, X, cluster_centroids, i): + costs = self.__expected_costs(X, cluster_centroids, i) + min_costs = np.argmin(costs, axis=-1) + is_optimal = min_costs == 0 + time_optimal = self.prediction_idx[min_costs + i] + return time_optimal, is_optimal # n_inst + + def predict_proba(self, X): + probas, times, is_optimal = self._predict(X) + is_optimal = np.stack(is_optimal) + idx = np.tile(np.arange(self.n_pred), (is_optimal.shape[1], 1)).T # n_pred x n_inst + idx[~is_optimal] = self.n_pred + idx = np.argmin(idx, 0) + probas = np.stack(probas) + return probas[idx], np.stack(times)[idx] + + def predict(self, X): + probas, times = self.predict_proba(X) + labels = probas.argmax(-1) + return labels, times diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index f6c9ab65d..51d169909 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -35,3 +35,13 @@ def _predict(self, X, training=True): double_check = predicted_probas.max(axis=-1) > self.probability_threshold non_acceptance[non_acceptance & double_check] = False return predicted_labels, predicted_probas, non_acceptance + + def _score(self, X, y, accuracy_importance=None): + scores = super()._score(X, y, accuracy_importance) + self._best_estimator_idx = np.argmax(scores) + return scores 
+ + def fit(self, X, y): + super().fit(X, y) + return self._score(X, y, self.accuracy_importance) + diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index ff58cf72d..c03c5d1e6 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -74,11 +74,11 @@ def predict(self, X): # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] return predicted_labels # prediction_points x n_instances - def _score(self, X, y, hm_shift_to_acc=None): - scores = super()._score(X, y, hm_shift_to_acc) + def _score(self, X, y, accuracy_importance=None): + scores = super()._score(X, y, accuracy_importance) self._best_estimator_idx = np.argmax(scores) return scores def fit(self, X, y): super().fit(X, y) - return self._score(X, y, self.hm_shift_to_acc) + return self._score(X, y, self.accuracy_importance) From 9f1624401b0693126c2984247505c00ea6cf11bb Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 5 Jul 2024 12:30:52 +0300 Subject: [PATCH 24/43] mlstm init --- .../core/models/nn/network_impl/mlstm.py | 127 ++++++++++++++++++ 1 file changed, 127 insertions(+) create mode 100644 fedot_ind/core/models/nn/network_impl/mlstm.py diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py new file mode 100644 index 000000000..31ca6fbd4 --- /dev/null +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -0,0 +1,127 @@ +from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel +from typing import Optional, Callable, Any, List, Union +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.data.data import InputData, OutputData +from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE +import torch.optim as optim +import torch.nn as nn +import torch.nn.functional as F +import torch +from fedot_ind.core.architecture.settings.computational 
import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array +import pandas as pd +from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams +from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter +import torch.utils.data as data +from fedot_ind.core.architecture.settings.computational import default_device + +class SqueezeExciteBlock(nn.Module): + def __init__(self, input_channels, filters, reduce=4): + super().__init__() + self.filters = filters + self.pool = nn.AvgPool1d(input_channels) + self.bottleneck = max(self.filters // reduce, 4) + self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) + self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) + torch.nn.init.kaiming_normal_(self.fc1.weight.data) + torch.nn.init.kaiming_normal_(self.fc2.weight.data) + + def forward(self, x): + input_x = x + x = self.pool(x) + x = F.relu(self.fc1(x.view(-1, 1, self.filters))) + x = F.sigmoid(self.fc2(x)) + x = x.view(-1, self.filters, 1) * input_x + return x + +class MLSTM_module(nn.Module): + def __init__(self, input_size, input_channels, + inner_size, inner_channels, + output_size, num_layers, dropout=0.25): + super().__init__() + self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) + self.lstm = nn.LSTM(input_size, inner_size, num_layers, + batch_first=True, dropout=dropout) + self.conv_branch = nn.Sequential( + nn.Conv1d(input_channels, inner_channels, + padding='same', + kernel_size=9), + nn.BatchNorm1d(inner_channels), + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels), + nn.Conv1d(inner_channels, inner_channels * 2, + padding='same', + kernel_size=5, + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels * 2), # n x c | n x c 
x l + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels * 2), + nn.Conv1d(inner_channels * 2, inner_channels, + padding='same', + kernel_size=3, + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels), # n x c | n x c x l + nn.ReLU(), + ) + seq = next(iter(self.conv_branch.modules())) + idx = [0, 4, 8] + for i in idx: + torch.nn.init.kaiming_uniform_(seq[i].weight.data) + + def forward(self, x): + x_lstm, _ = self.lstm(x) # n x input_ch x inner_size + x_conv = self.conv_branch(x) # n x inner_ch x len + print(x_conv.size(), x_lstm.size()) + x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) + x = F.softmax(self.proj(x)) + return x + + +class MLSTM(BaseNeuralModel): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + # self.num_classes = params.get('num_classes', None) + # self.epochs = params.get('epochs', 100) + # self.batch_size = params.get('batch_size', 16) + # self.activation = params.get('activation', 'ReLU') + # self.learning_rate = 0.001 + + self.dropout = params.get('dropout', 0.25) + self.hidden_size = params.get('hidden_size', 64) + self.hidden_channels = params.get('hidden_channels', 32) + self.num_layers = params.get('num_layers', 2) + # self.target = None + # self.task_type = None + + def _init_model(self, ts: InputData): + _, input_channels, input_size = ts.features.shape + self.model = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + self.model_for_inference = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + optimizer = optim.Adam(self.model.parameters(), lr=0.001) + if ts.num_classes == 2: + loss_fn = CROSS_ENTROPY() + else: + loss_fn = MULTI_CLASS_CROSS_ENTROPY() + return loss_fn, optimizer + + @convert_to_3d_torch_array + def _fit_model(self, 
ts: InputData): + loss_fn, optimizer = self._init_model(ts) + train_loader, val_loader = self._prepare_data(ts, split_data=True) + self._train_loop( + train_loader=train_loader, + val_loader=val_loader, + loss_fn=loss_fn, + optimizer=optimizer + ) + From d118462f3c88c44f66959552ada7af205f13349d Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 5 Jul 2024 12:30:52 +0300 Subject: [PATCH 25/43] mlstm registered --- .../architecture/abstraction/decorators.py | 5 +- fedot_ind/core/models/early_tc/ecec.py | 62 ++++--- .../core/models/nn/network_impl/mlstm.py | 154 ++++++++++++++++++ .../data/default_operation_params.json | 4 + .../data/industrial_model_repository.json | 6 + fedot_ind/core/repository/model_repository.py | 5 +- 6 files changed, 211 insertions(+), 25 deletions(-) diff --git a/fedot_ind/core/architecture/abstraction/decorators.py b/fedot_ind/core/architecture/abstraction/decorators.py index 1e854be56..0b915c85c 100644 --- a/fedot_ind/core/architecture/abstraction/decorators.py +++ b/fedot_ind/core/architecture/abstraction/decorators.py @@ -42,13 +42,14 @@ def decorated_func(self, *args): def convert_to_3d_torch_array(func): def decorated_func(self, *args): - init_data = args[0] + init_data, *args = args data = DataConverter(data=init_data).convert_to_torch_format() if isinstance(init_data, InputData): init_data.features = data else: init_data = data - return func(self, init_data, *args[1:]) + return func(self, init_data, *args) + return decorated_func diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index a00df631d..45f7f9fe4 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -12,26 +12,53 @@ def __init__(self, params: Optional[OperationParameters] = None): def _init_model(self, X, y): super()._init_model(X, y) - self._confidences = np.ones((X.shape[0], self.n_pred)) + self._reliabilities = np.zeros((self.n_pred, self.n_classes, self.n_classes)) + + def 
_predict_one_slave(self, X, i, offset=0): + predicted_probas, predicted_labels = super()._predict_one_slave(X, i, offset) + reliabilities = self._reliabilities[i, predicted_labels, predicted_labels].flatten() # n_inst + return predicted_labels.astype(int), predicted_probas, reliabilities + + def _predict(self, X, training=False): + predicted_labels, predicted_probas, reliabilities = super()._predict(X, training) + reliabilities = np.stack(reliabilities) + confidences = 1 - np.cumprod(1 - reliabilities, axis=0) + non_confident = confidences < self.confidence_thresholds[:len(predicted_labels), None] + return predicted_labels, predicted_probas, non_confident, confidences - def _score(self, X, y, alpha): + def predict(self, X): + predicted_labels, _, non_confident, confidences = self._predict(X) + predicted_labels = np.stack(predicted_labels) + predicted_labels[non_confident] = -1 + return predicted_labels, confidences + + def predict_proba(self, X): + _, predicted_probas, non_confident, confidences = self._predict(X) + predicted_probas = np.stack(predicted_probas) + predicted_probas[non_confident] = -1 + return predicted_probas, confidences + + def _score(self, X, y, alpha, training=False): y = y.astype(int) - predicted_labels = np.stack(super()._predict(X)[0]).astype(int) # n_pred x n_inst + predicted_labels, *_ = super()._predict(X, training) # n_pred x n_inst + predicted_labels = np.stack(predicted_labels) n = predicted_labels.shape[0] - accuracies = (predicted_labels == np.tile(y, (1, n))) # n_pred x n_inst + accuracies = (predicted_labels == np.tile(y, (n, 1))) # n_pred x n_inst confidences = np.ones((n, X.shape[0]), dtype='float32') for i in range(n): y_pred = predicted_labels[i] reliability_i = confusion_matrix(y, y_pred, normalize='pred') confidences[i] = 1 - reliability_i[y, y_pred] # n_inst + self._reliabilities[i] = reliability_i confidences = 1 - np.cumprod(confidences, axis=0) # n_pred x n_inst candidates = self._select_thrs(confidences) # n_candidates - 
cfs = np.zeros_like(candidates) + cfs = np.zeros((len(candidates), n)) for i, candidate in enumerate(candidates): mask = confidences >= candidate # n_pred x n_inst accuracy_for_candidate = (accuracies * mask).sum(1) / mask.sum(1) # n_pred cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) - return candidates[np.argmin(cfs)] + self._best_estimator_idx = np.argmin(cfs.mean(0)) + return candidates[np.argmin(cfs, axis=0)] # n_pred @staticmethod def _select_thrs(confidences): @@ -39,24 +66,15 @@ def _select_thrs(confidences): difference = np.diff(C) pair_means = C[:-1] + difference / 2 difference_shifted = np.roll(difference, 1) - difference_idx = np.argwhere(difference > difference_shifted) - return pair_means[difference_idx].flatten() + difference_idx = np.argwhere(difference <= difference_shifted) + means_candidates = pair_means[difference_idx].flatten() + return means_candidates if len(means_candidates) else C @staticmethod def cost_func(earliness, accuracies, alpha): - return alpha * accuracies + (1 - alpha) * earliness + return alpha * (1 - accuracies) + (1 - alpha) * earliness def fit(self, X, y): - self.confidence_threshold = super().fit(X, y) - - - - - - - - - - - - + super().fit(X, y) + self.confidence_thresholds = self._score(X, y, self.accuracy_importance, training=True) + \ No newline at end of file diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 31ca6fbd4..9a0a52ba6 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -125,3 +125,157 @@ def _fit_model(self, ts: InputData): optimizer=optimizer ) + +from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel +from typing import Optional, Callable, Any, List, Union +from fedot.core.operations.operation_parameters import OperationParameters +from fedot.core.data.data import InputData, OutputData +from 
fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE +import torch.optim as optim +import torch.nn as nn +import torch.nn.functional as F +import torch +from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array +import pandas as pd +from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams +from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter +import torch.utils.data as data +from fedot_ind.core.architecture.settings.computational import default_device + +class SqueezeExciteBlock(nn.Module): + def __init__(self, input_channels, filters, reduce=4): + super().__init__() + self.filters = filters + self.pool = nn.AvgPool1d(input_channels) + self.bottleneck = max(self.filters // reduce, 4) + self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) + self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) + torch.nn.init.kaiming_normal_(self.fc1.weight.data) + torch.nn.init.kaiming_normal_(self.fc2.weight.data) + + def forward(self, x): + input_x = x + x = self.pool(x) + x = F.relu(self.fc1(x.view(-1, 1, self.filters))) + x = F.sigmoid(self.fc2(x)) + x = x.view(-1, self.filters, 1) * input_x + return x + +class MLSTM_module(nn.Module): + def __init__(self, input_size, input_channels, + inner_size, inner_channels, + output_size, num_layers, dropout=0.25): + super().__init__() + self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) + self.lstm = nn.LSTM(input_size, inner_size, num_layers, + batch_first=True, dropout=dropout) + self.conv_branch = nn.Sequential( + nn.Conv1d(input_channels, inner_channels, + padding='same', + kernel_size=9), + 
nn.BatchNorm1d(inner_channels), + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels), + nn.Conv1d(inner_channels, inner_channels * 2, + padding='same', + kernel_size=5, + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l + nn.ReLU(), + SqueezeExciteBlock(input_size, inner_channels * 2), + nn.Conv1d(inner_channels * 2, inner_channels, + padding='same', + kernel_size=3, + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels), # n x c | n x c x l + nn.ReLU(), + ) + seq = next(iter(self.conv_branch.modules())) + idx = [0, 4, 8] + for i in idx: + torch.nn.init.kaiming_uniform_(seq[i].weight.data) + + def forward(self, x, hidden_state=None): + x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size + x_conv = self.conv_branch(x) # n x inner_ch x len + x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) + x = F.softmax(self.proj(x)) + return x#, hidden_state + + def augment_zero_padding(self, X: torch.Tensor): + res = [] + for i in self.prediction_idx: + zeroed_X = X[...] + zeroed_X[..., i + 1:] = 0 + res.append(zeroed_X) + res = torch.concat(res, 0) + return res[torch.randperm(res.size(0)), ...] 
+ +class MLSTM(BaseNeuralModel): + def __init__(self, params: Optional[OperationParameters] = None): + if params is None: + params = {} + super().__init__() + # self.num_classes = params.get('num_classes', None) + # self.epochs = params.get('epochs', 100) + # self.batch_size = params.get('batch_size', 16) + # self.activation = params.get('activation', 'ReLU') + # self.learning_rate = 0.001 + + self.dropout = params.get('dropout', 0.25) + self.hidden_size = params.get('hidden_size', 64) + self.hidden_channels = params.get('hidden_channels', 32) + self.num_layers = params.get('num_layers', 2) + # self.target = None + # self.task_type = None + self.interval_percentage = params.get('interval_percentage', 10) + self.min_ts_length = params.get('min_ts_length', 5) + + def _compute_prediction_points(self, n_idx): + interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) + prediction_idx = np.arange(0, n_idx, interval_length) + self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + return prediction_idx + + def _init_model(self, ts: InputData): + _, input_channels, input_size = ts.features.shape + self.prediction_idx = self._compute_prediction_points(input_size) + self.model = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + self.model_for_inference = MLSTM_module(input_size, input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) + optimizer = optim.Adam(self.model.parameters(), lr=0.001) + if ts.num_classes == 2: + loss_fn = CROSS_ENTROPY() + else: + loss_fn = MULTI_CLASS_CROSS_ENTROPY() + return loss_fn, optimizer + + def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): + return super()._train_loop(train_loader, val_loader, loss_fn, optimizer) + + @convert_to_3d_torch_array + def _fit_model(self, ts: InputData): + if isinstance(ts, 
torch.Tensor): + ts = self.augment_zero_padding(ts) + else: + print(type(ts)) + loss_fn, optimizer = self._init_model(ts) + train_loader, val_loader = self._prepare_data(ts, split_data=True) + self._train_loop( + train_loader=train_loader, + val_loader=val_loader, + loss_fn=loss_fn, + optimizer=optimizer + ) + + + + diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index 11980e4b4..98a7e2986 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -166,6 +166,10 @@ "learning_rate": "constant", "solver": "adam" }, + "mlstm_model": { + "epochs": 100, + "batch_size": 16 + }, "ar": { "lag_1": 7, "lag_2": 12, diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index ccbd1e0a7..42f58446a 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -370,6 +370,12 @@ "automl" ] }, + "mlstm_model": { + "meta": "fedot_NN_classification", + "presets": ["ts"], + "tags": [], + "input_type": "[DataTypesEnum.table]" + }, "xcm_model": { "meta": "fedot_NN_classification", "presets": [ diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index ac23c4f22..c7283a1bc 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -55,6 +55,7 @@ from fedot_ind.core.models.nn.network_impl.inception import InceptionTimeModel from fedot_ind.core.models.nn.network_impl.lora_nn import LoraModel from fedot_ind.core.models.nn.network_impl.mini_rocket import MiniRocketExtractor +from fedot_ind.core.models.nn.network_impl.mlstm import MLSTM from fedot_ind.core.models.nn.network_impl.nbeats import NBeatsModel from 
fedot_ind.core.models.nn.network_impl.resnet import ResNetModel from fedot_ind.core.models.nn.network_impl.tst import TSTModel @@ -193,7 +194,9 @@ class AtomizedModel(Enum): # linear_dummy_model 'dummy': DummyOverComplicatedNeuralNetwork, # linear_dummy_model - 'lora_model': LoraModel + 'lora_model': LoraModel, + # early ts classification + 'mlstm_model': MLSTM } From 7a2c477720a098a4668be1f61c368aa42818193d Mon Sep 17 00:00:00 2001 From: leostre Date: Tue, 9 Jul 2024 14:33:24 +0300 Subject: [PATCH 26/43] fitting w augmentation --- .../architecture/abstraction/decorators.py | 9 +- .../models/nn/network_impl/base_nn_model.py | 6 +- .../core/models/nn/network_impl/mlstm.py | 201 ++++-------------- 3 files changed, 55 insertions(+), 161 deletions(-) diff --git a/fedot_ind/core/architecture/abstraction/decorators.py b/fedot_ind/core/architecture/abstraction/decorators.py index 0b915c85c..3c01bb56d 100644 --- a/fedot_ind/core/architecture/abstraction/decorators.py +++ b/fedot_ind/core/architecture/abstraction/decorators.py @@ -11,9 +11,10 @@ def fedot_data_type(func): def decorated_func(self, *args): - if not isinstance(args[0], InputData): - args[0] = DataConverter(data=args[0]) - features = args[0].features + data, *rest_args = args + if not isinstance(data, InputData): + data = DataConverter(data=data) + features = data.features if len(features.shape) < 4: try: @@ -22,7 +23,7 @@ def decorated_func(self, *args): input_data_squeezed = np.squeeze(features) else: input_data_squeezed = features - return func(self, input_data_squeezed, args[1]) + return func(self, input_data_squeezed, *rest_args) return decorated_func diff --git a/fedot_ind/core/models/nn/network_impl/base_nn_model.py b/fedot_ind/core/models/nn/network_impl/base_nn_model.py index de83a2f06..e9d6c7274 100644 --- a/fedot_ind/core/models/nn/network_impl/base_nn_model.py +++ b/fedot_ind/core/models/nn/network_impl/base_nn_model.py @@ -90,7 +90,7 @@ def _fit_model(self, ts: InputData, split_data: bool = True): 
def _init_model(self, ts) -> tuple: raise NotImplementedError() - def _prepare_data(self, ts, split_data: bool = True): + def _prepare_data(self, ts, split_data: bool = True, collate_fn=None): if split_data: train_data, val_data = train_test_data_setup( @@ -102,13 +102,13 @@ def _prepare_data(self, ts, split_data: bool = True): val_dataset = None train_loader = torch.utils.data.DataLoader( - train_dataset, batch_size=self.batch_size, shuffle=True) + train_dataset, batch_size=self.batch_size, shuffle=True, collate_fn=collate_fn) if val_dataset is None: val_loader = val_dataset else: val_loader = torch.utils.data.DataLoader( - val_dataset, batch_size=self.batch_size, shuffle=True) + val_dataset, batch_size=self.batch_size, shuffle=True, collate_fn=collate_fn) self.label_encoder = train_dataset.label_encoder return train_loader, val_loader diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 9a0a52ba6..612d2b11b 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -4,11 +4,13 @@ from fedot.core.data.data import InputData, OutputData from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE import torch.optim as optim +from torch.optim import lr_scheduler import torch.nn as nn import torch.nn.functional as F import torch +from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array, fedot_data_type import pandas as pd from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping @@ -70,149 +72,19 @@ def __init__(self, input_size, input_channels, for i in 
idx: torch.nn.init.kaiming_uniform_(seq[i].weight.data) - def forward(self, x): - x_lstm, _ = self.lstm(x) # n x input_ch x inner_size - x_conv = self.conv_branch(x) # n x inner_ch x len - print(x_conv.size(), x_lstm.size()) - x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) - x = F.softmax(self.proj(x)) - return x - - -class MLSTM(BaseNeuralModel): - def __init__(self, params: Optional[OperationParameters] = None): - if params is None: - params = {} - super().__init__() - # self.num_classes = params.get('num_classes', None) - # self.epochs = params.get('epochs', 100) - # self.batch_size = params.get('batch_size', 16) - # self.activation = params.get('activation', 'ReLU') - # self.learning_rate = 0.001 - - self.dropout = params.get('dropout', 0.25) - self.hidden_size = params.get('hidden_size', 64) - self.hidden_channels = params.get('hidden_channels', 32) - self.num_layers = params.get('num_layers', 2) - # self.target = None - # self.task_type = None - - def _init_model(self, ts: InputData): - _, input_channels, input_size = ts.features.shape - self.model = MLSTM_module(input_size, input_channels, - self.hidden_size, self.hidden_channels, - self.num_classes, self.num_layers, - self.dropout) - self.model_for_inference = MLSTM_module(input_size, input_channels, - self.hidden_size, self.hidden_channels, - self.num_classes, self.num_layers, - self.dropout) - optimizer = optim.Adam(self.model.parameters(), lr=0.001) - if ts.num_classes == 2: - loss_fn = CROSS_ENTROPY() - else: - loss_fn = MULTI_CLASS_CROSS_ENTROPY() - return loss_fn, optimizer - - @convert_to_3d_torch_array - def _fit_model(self, ts: InputData): - loss_fn, optimizer = self._init_model(ts) - train_loader, val_loader = self._prepare_data(ts, split_data=True) - self._train_loop( - train_loader=train_loader, - val_loader=val_loader, - loss_fn=loss_fn, - optimizer=optimizer - ) - - -from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel 
-from typing import Optional, Callable, Any, List, Union -from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.data.data import InputData, OutputData -from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE -import torch.optim as optim -import torch.nn as nn -import torch.nn.functional as F -import torch -from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array -import pandas as pd -from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams -from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter -import torch.utils.data as data -from fedot_ind.core.architecture.settings.computational import default_device - -class SqueezeExciteBlock(nn.Module): - def __init__(self, input_channels, filters, reduce=4): - super().__init__() - self.filters = filters - self.pool = nn.AvgPool1d(input_channels) - self.bottleneck = max(self.filters // reduce, 4) - self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) - self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) - torch.nn.init.kaiming_normal_(self.fc1.weight.data) - torch.nn.init.kaiming_normal_(self.fc2.weight.data) - - def forward(self, x): - input_x = x - x = self.pool(x) - x = F.relu(self.fc1(x.view(-1, 1, self.filters))) - x = F.sigmoid(self.fc2(x)) - x = x.view(-1, self.filters, 1) * input_x - return x - -class MLSTM_module(nn.Module): - def __init__(self, input_size, input_channels, - inner_size, inner_channels, - output_size, num_layers, dropout=0.25): - super().__init__() - self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) - self.lstm = 
nn.LSTM(input_size, inner_size, num_layers, - batch_first=True, dropout=dropout) - self.conv_branch = nn.Sequential( - nn.Conv1d(input_channels, inner_channels, - padding='same', - kernel_size=9), - nn.BatchNorm1d(inner_channels), - nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels), - nn.Conv1d(inner_channels, inner_channels * 2, - padding='same', - kernel_size=5, - ), # c x l | n x c x l - nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l - nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels * 2), - nn.Conv1d(inner_channels * 2, inner_channels, - padding='same', - kernel_size=3, - ), # c x l | n x c x l - nn.BatchNorm1d(inner_channels), # n x c | n x c x l - nn.ReLU(), - ) - seq = next(iter(self.conv_branch.modules())) - idx = [0, 4, 8] - for i in idx: - torch.nn.init.kaiming_uniform_(seq[i].weight.data) - - def forward(self, x, hidden_state=None): + def forward(self, x, hidden_state=None, return_hidden_state=False): + # hidden_state = hidden_state or self.hidden_state + if not self.training: + print(x.shape) x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size x_conv = self.conv_branch(x) # n x inner_ch x len x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) x = F.softmax(self.proj(x)) + # self.hidden_state = hidden_state + if return_hidden_state: + return x, hidden_state return x#, hidden_state - def augment_zero_padding(self, X: torch.Tensor): - res = [] - for i in self.prediction_idx: - zeroed_X = X[...] - zeroed_X[..., i + 1:] = 0 - res.append(zeroed_X) - res = torch.concat(res, 0) - return res[torch.randperm(res.size(0)), ...] 
class MLSTM(BaseNeuralModel): def __init__(self, params: Optional[OperationParameters] = None): @@ -229,11 +101,19 @@ def __init__(self, params: Optional[OperationParameters] = None): self.hidden_size = params.get('hidden_size', 64) self.hidden_channels = params.get('hidden_channels', 32) self.num_layers = params.get('num_layers', 2) - # self.target = None - # self.task_type = None self.interval_percentage = params.get('interval_percentage', 10) self.min_ts_length = params.get('min_ts_length', 5) + def __repr__(self): + return 'MLSTM' + + @convert_to_3d_torch_array + def _predict_model(self, ts: InputData, output_mode='default'): + self.model.eval() + x_test = torch.Tensor(ts).to(self._device) + pred = self.model(x_test) + return self._convert_predict(pred, output_mode) + def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) prediction_idx = np.arange(0, n_idx, interval_length) @@ -241,7 +121,7 @@ def _compute_prediction_points(self, n_idx): return prediction_idx def _init_model(self, ts: InputData): - _, input_channels, input_size = ts.features.shape + *_, input_channels, input_size = ts.features.shape self.prediction_idx = self._compute_prediction_points(input_size) self.model = MLSTM_module(input_size, input_channels, self.hidden_size, self.hidden_channels, @@ -255,27 +135,40 @@ def _init_model(self, ts: InputData): if ts.num_classes == 2: loss_fn = CROSS_ENTROPY() else: - loss_fn = MULTI_CLASS_CROSS_ENTROPY() + loss_fn = CROSS_ENTROPY() return loss_fn, optimizer - def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): - return super()._train_loop(train_loader, val_loader, loss_fn, optimizer) + # @convert_to_3d_torch_array + # def predict(self, ts: InputData, output_mode: str = 'default'): + # return super().predict(ts, output_mode) + + # def predict_for_fit(self, ts: InputData, output_mode: str = 'default'): + # return super().predict_for_fit(ts, output_mode) 
@convert_to_3d_torch_array - def _fit_model(self, ts: InputData): - if isinstance(ts, torch.Tensor): - ts = self.augment_zero_padding(ts) - else: - print(type(ts)) + def _fit_model(self, ts: InputData, mode='zero_padding'): + self.epochs = 1 # !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1 loss_fn, optimizer = self._init_model(ts) - train_loader, val_loader = self._prepare_data(ts, split_data=True) + + train_loader, val_loader = self._prepare_data(ts, split_data=False, + collate_fn=getattr(self, '_augment_zero_padding')) self._train_loop( train_loader=train_loader, val_loader=val_loader, loss_fn=loss_fn, - optimizer=optimizer + optimizer=optimizer, ) - - - + def _augment_zero_padding(self, batch,): + prediction_idx = self.prediction_idx + x, y = zip(*batch) + X, y = torch.stack(x), torch.stack(y) + y = np.tile(y, (len(prediction_idx), 1)) + res = [] + for i in prediction_idx: + zeroed_X = X[...] + zeroed_X[..., i + 1:] = 0 + res.append(zeroed_X) + res = np.concatenate(res, 0) + perm = np.random.permutation(res.shape[0]) + return torch.tensor(res[perm, ...]), torch.tensor(y[perm]) From 370eb28e1b5b77274d4c2039c07ca7f5f96b0356 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 01:27:24 +0300 Subject: [PATCH 27/43] all work, but need eval --- .../core/models/early_tc/base_early_tc.py | 3 + fedot_ind/core/models/early_tc/ecec.py | 61 +++++++++++++------ fedot_ind/core/models/early_tc/economy_k.py | 21 +++++-- .../core/models/early_tc/prob_threshold.py | 29 ++++++--- fedot_ind/core/models/early_tc/teaser.py | 19 ++++-- 5 files changed, 93 insertions(+), 40 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 5e180c2a9..38e5fd23f 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -71,6 +71,9 @@ def _select_estimators(self, X, training=False): elif training or self.prediction_mode == 'all': last_idx, offset = 
self._get_applicable_index(X.shape[-1] - 1) estimator_indices = np.arange(last_idx + 1) + elif 'last_available': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = [last_idx] else: raise ValueError('Unknown prediction mode') return estimator_indices, offset diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index 45f7f9fe4..00962a233 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -9,6 +9,7 @@ class ECEC(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): super().__init__(params) + self.__cv = 5 def _init_model(self, X, y): super()._init_model(X, y) @@ -30,34 +31,39 @@ def predict(self, X): predicted_labels, _, non_confident, confidences = self._predict(X) predicted_labels = np.stack(predicted_labels) predicted_labels[non_confident] = -1 - return predicted_labels, confidences + if self.transform_score: + confidences = self._transform_score(confidences) + return self._remove_first_1d(predicted_labels, confidences) def predict_proba(self, X): _, predicted_probas, non_confident, confidences = self._predict(X) predicted_probas = np.stack(predicted_probas) predicted_probas[non_confident] = -1 - return predicted_probas, confidences + if self.transform_score: + confidences = self._transform_score(confidences) + return self._remove_first_1d(predicted_probas, confidences) + + def _fit_one_interval(self, X, y, i): + X_part = X[..., :self.prediction_idx[i] + 1] + X_part = self.scalers[i].fit_transform(X_part) + self.slave_estimators[i].fit(X_part, y) + labels = cross_val_predict(self.slave_estimators[i], X_part, y, cv=self.__cv) + return labels - def _score(self, X, y, alpha, training=False): - y = y.astype(int) - predicted_labels, *_ = super()._predict(X, training) # n_pred x n_inst - predicted_labels = np.stack(predicted_labels) - n = predicted_labels.shape[0] - accuracies = (predicted_labels == np.tile(y, (n, 1))) # 
n_pred x n_inst - confidences = np.ones((n, X.shape[0]), dtype='float32') - for i in range(n): - y_pred = predicted_labels[i] - reliability_i = confusion_matrix(y, y_pred, normalize='pred') - confidences[i] = 1 - reliability_i[y, y_pred] # n_inst - self._reliabilities[i] = reliability_i - confidences = 1 - np.cumprod(confidences, axis=0) # n_pred x n_inst + def _score(self, y, y_pred, alpha): + matches = (y_pred == np.tile(y, (self.n_pred, 1))) # n_pred x n_inst + n, n_inst = matches.shape[:2] + confidences = np.ones((n, n_inst), dtype='float32') + for i in range(self.n_pred): + confidences[i] = self._reliabilities[i, y, y_pred[i]] + confidences = 1 - np.cumprod(1 - confidences, axis=0) # n_pred x n_inst candidates = self._select_thrs(confidences) # n_candidates cfs = np.zeros((len(candidates), n)) for i, candidate in enumerate(candidates): mask = confidences >= candidate # n_pred x n_inst - accuracy_for_candidate = (accuracies * mask).sum(1) / mask.sum(1) # n_pred + accuracy_for_candidate = (matches * mask).sum(1) / mask.sum(1) # n_pred cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) - self._best_estimator_idx = np.argmin(cfs.mean(0)) + self._chosen_estimator_idx = np.argmin(cfs.mean(0)) return candidates[np.argmin(cfs, axis=0)] # n_pred @staticmethod @@ -75,6 +81,23 @@ def cost_func(earliness, accuracies, alpha): return alpha * (1 - accuracies) + (1 - alpha) * earliness def fit(self, X, y): - super().fit(X, y) - self.confidence_thresholds = self._score(X, y, self.accuracy_importance, training=True) + y = np.array(y).flatten().astype(int) + self._init_model(X, y) + labels = [] + for i in range(self.n_pred): + labels.append(self._fit_one_interval(X, y, i)) + predicted_labels = np.stack(labels) + for i in range(self.n_pred): + y_pred = predicted_labels[i] + reliability_i = confusion_matrix(y, y_pred, normalize='pred') + self._reliabilities[i] = reliability_i + self.confidence_thresholds = self._score(y, predicted_labels, 
self.accuracy_importance) + + def _transform_score(self, confidences): + thr = self.confidence_thresholds[self._estimator_for_predict[-1]] + confidences = confidences - thr + positive = confidences > 0 + confidences[positive] *= 1 / (1 - thr) + confidences[~positive] *= 1 / thr + return confidences \ No newline at end of file diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 639e680cd..8eb207550 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -11,8 +11,10 @@ def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} super().__init__(params) + self.prediction_mode = params.get('prediction_mode', 'last_available') self.lambda_ = params.get('lambda', 1.) self._cluster_factor = params.get('cluster_factor' , 1) + # self.confidence_mode = params.get('confidence_mode', 'time') # or 'confidence' self._random_state = 2104 self.__cv = 5 @@ -77,13 +79,20 @@ def _get_prediction_time(self, X, cluster_centroids, i): def predict_proba(self, X): probas, times, is_optimal = self._predict(X) is_optimal = np.stack(is_optimal) - idx = np.tile(np.arange(self.n_pred), (is_optimal.shape[1], 1)).T # n_pred x n_inst - idx[~is_optimal] = self.n_pred - idx = np.argmin(idx, 0) - probas = np.stack(probas) - return probas[idx], np.stack(times)[idx] + probas, times = np.stack(probas), np.stack(times) + if self.transform_score: + times = self._transform_score(times) + return self._remove_first_1d(probas, times) def predict(self, X): probas, times = self.predict_proba(X) labels = probas.argmax(-1) - return labels, times + return self._remove_first_1d(labels, times) + + def _transform_score(self, time): + idx = self._estimator_for_predict[-1] + scores = -(1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) + scores[scores == 0] = 1 # no posibility for lininterp when sure + return scores + + diff --git 
a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 51d169909..8dcb8828f 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -7,7 +7,7 @@ class ProbabilityThresholdClassifier(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} - super().__init__() + super().__init__(params) self.probability_threshold = params.get('probability_threshold', None) def _init_model(self, X, y): @@ -18,19 +18,23 @@ def _init_model(self, X, y): def predict_proba(self, X): _, predicted_probas, non_acceptance = self._predict(X) predicted_probas[non_acceptance] = 0 - return predicted_probas.squeeze() + scores = predicted_probas.max(-1) + if self.transform_score: + scores = self._transform_score(scores) + return self._remove_first_1d(predicted_probas, scores) def predict(self, X): - predicted_labels, _, non_acceptance = self._predict(X, training=False) + predicted_labels, predicted_probas, non_acceptance = self._predict(X, training=False) predicted_labels[non_acceptance] = -1 - # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] - return predicted_labels # prediction_points x n_instances + scores = predicted_probas.max(-1) + if self.transform_score: + scores = self._transform_score(scores) + return self._remove_first_1d(predicted_labels, scores) # (prediction_points x) n_instances def _predict(self, X, training=True): predicted_probas, predicted_labels = super()._predict(X, training) predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) - # print(predicted_labels.shape, predicted_probas.shape) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions double_check = predicted_probas.max(axis=-1) > self.probability_threshold non_acceptance[non_acceptance & double_check] = False @@ -38,10 +42,17 @@ def _predict(self, X, training=True): 
def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) - self._best_estimator_idx = np.argmax(scores) + self._chosen_estimator_idx = np.argmax(scores) return scores def fit(self, X, y): super().fit(X, y) - return self._score(X, y, self.accuracy_importance) - + self._score(X, y, self.accuracy_importance) + + def _transform_score(self, confidences): + thr = self.probability_threshold + confidences = confidences - thr + positive = confidences > 0 + confidences[positive] *= 1 / (1 - thr) + confidences[~positive] *= 1 / thr + return confidences diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index c03c5d1e6..10d36e5a0 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -54,31 +54,38 @@ def _predict(self, X): # for each point of estimation for i in range(predicted_labels.shape[0]): # find not accepted points - ith_point_to_oc = to_oc_check[to_oc_check[:, 0] == i, 1] - X_to_ith = X_ocs[i][ith_point_to_oc] + X_to_ith = X_ocs[i] # if they are not outliers final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # 1 for accept -1 for reject # mark as accepted - non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False + # non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False final_verdicts[i] = final_verdict + non_acceptance[non_acceptance & (final_verdict > 0)] = False return predicted_labels, predicted_probas, non_acceptance, final_verdicts def predict_proba(self, X): _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] - return predicted_probas.squeeze() + if self.transform_score: + final_verdicts = self._transform_score(final_verdicts) + return self._remove_first_1d(predicted_probas, final_verdicts) def predict(self, X): predicted_labels, _, non_acceptance, final_verdicts = 
self._predict(X) predicted_labels[non_acceptance] = -1 # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] - return predicted_labels # prediction_points x n_instances + if self.transform_score: + final_verdicts = self._transform_score(final_verdicts) + return self._remove_first_1d(predicted_labels, final_verdicts) # (prediction_points x) n_instances def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) - self._best_estimator_idx = np.argmax(scores) + self._chosen_estimator_idx = np.argmax(scores) return scores def fit(self, X, y): super().fit(X, y) return self._score(X, y, self.accuracy_importance) + + def _transform_score(self, scores): + return np.tanh(scores) From e51949b65ee4a047b6536e7eb15861faab6297e5 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 12:09:39 +0300 Subject: [PATCH 28/43] evth converged to one interface + refactored --- .../core/models/early_tc/base_early_tc.py | 53 ++-- fedot_ind/core/models/early_tc/ecec.py | 18 +- fedot_ind/core/models/early_tc/economy_k.py | 15 +- .../core/models/early_tc/prob_threshold.py | 14 +- fedot_ind/core/models/early_tc/teaser.py | 22 +- .../core/models/nn/network_impl/mlstm.py | 235 ++++++++++++------ .../data/default_operation_params.json | 14 +- .../data/industrial_model_repository.json | 22 +- fedot_ind/core/repository/model_repository.py | 8 +- fedot_ind/core/tuning/search_space.py | 32 ++- 10 files changed, 280 insertions(+), 153 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 38e5fd23f..9fbc162c5 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -11,10 +11,12 @@ def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} super().__init__() - self.prediction_mode = params.get('prediction_mode', 'best_by_harmonic_mean') self.interval_percentage = 
params.get('interval_percentage', 10) - self.consecutive_predictions = params.get('consecutive_predictions', 3) + self.consecutive_predictions = params.get('consecutive_predictions', 1) self.accuracy_importance = params.get('accuracy_importance', 1.) + + self.prediction_mode = params.get('prediction_mode', 'last_available') + self.transform_score = params.get('transform_score', True) self.min_ts_length = params.get('min_ts_step', 3) self.random_state = params.get('random_state', None) self.weasel_params = {} @@ -26,14 +28,15 @@ def _init_model(self, X, y): self.n_pred = len(self.prediction_idx) self.slave_estimators = [WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] self.scalers = [StandardScaler() for _ in range(self.n_pred)] - self._best_estimator_idx = -1 + self._chosen_estimator_idx = -1 self.classes_ = [np.unique(y)] + self._estimator_for_predict = [-1] @property def required_length(self): - if not hasattr(self, '_best_estimator_idx'): + if not hasattr(self, '_chosen_estimator_idx'): return None - return self.prediction_idx[self._best_estimator_idx] + return self.prediction_idx[self._chosen_estimator_idx] @property def n_classes(self): @@ -47,7 +50,7 @@ def fit(self, X, y=None): self._fit_one_interval(X, y, i) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i] + 1] # what's dimensionality of input? will it work in case of multivariate? 
+ X_part = X[..., :self.prediction_idx[i] + 1] X_part = self.scalers[i].fit_transform(X_part) probas = self.slave_estimators[i].fit_predict_proba(X_part, y) return probas @@ -67,19 +70,21 @@ def _compute_prediction_points(self, n_idx): def _select_estimators(self, X, training=False): offset = 0 if not training and self.prediction_mode == 'best_by_harmonic_mean': - estimator_indices = [self._best_estimator_idx] + estimator_indices = [self._chosen_estimator_idx] + elif not training and self.prediction_mode == 'last_available': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = [last_idx] elif training or self.prediction_mode == 'all': last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) estimator_indices = np.arange(last_idx + 1) - elif 'last_available': - last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) - estimator_indices = [last_idx] else: raise ValueError('Unknown prediction mode') return estimator_indices, offset def _predict(self, X, training=True): estimator_indices, offset = self._select_estimators(X, training) + if not training: + self._estimator_for_predict = estimator_indices prediction = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) @@ -94,20 +99,32 @@ def _consecutive_count(self, predicted_labels: List[np.array]): consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 return consecutive_labels # prediction_points x n_instances - def predict_proba(self, X): - raise NotImplementedError + def predict_proba(self, *args): + predicted_probas, scores, *_ = args + if self.transform_score: + scores = self._transform_score(scores) + scores = np.tile(scores[..., None], (1, 1, self.n_classes)) + prediction = np.stack([predicted_probas, scores], axis=0) + if prediction.shape[1] == 1: + prediction = prediction.squeeze(1) + return prediction def predict(self, X): - raise NotImplementedError + prediction = self.predict_proba(X) + labels = 
prediction[0:1].argmax(-1) + scores = prediction[1:2, ..., 0] + prediction = np.stack([labels, scores], 0) + if prediction.shape[1] == 1: + prediction = prediction.squeeze(1) + return prediction - def _score(self, X, y, hm_shift_to_acc=None): + def _score(self, X, y, accuracy_importance=None, training=True): y = np.array(y).flatten() - hm_shift_to_acc = hm_shift_to_acc or self.accuracy_importance - predictions = self._predict(X)[0] + accuracy_importance = accuracy_importance or self.accuracy_importance + predictions = self._predict(X, training)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) - return (1 + hm_shift_to_acc) * accuracies * self.earliness[:prediction_points] / (hm_shift_to_acc * accuracies + self.earliness[:prediction_points]) - + return (1 + accuracy_importance) * accuracies * self.earliness[:prediction_points] / (accuracy_importance * accuracies + self.earliness[:prediction_points]) def _get_applicable_index(self, last_available_idx): idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index 00962a233..f6e163d25 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -3,7 +3,6 @@ from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.models.early_tc.base_early_tc import BaseETC from sklearn.model_selection import cross_val_predict -from sklearn.base import clone from sklearn.metrics import confusion_matrix class ECEC(BaseETC): @@ -25,23 +24,14 @@ def _predict(self, X, training=False): reliabilities = np.stack(reliabilities) confidences = 1 - np.cumprod(1 - reliabilities, axis=0) non_confident = confidences < self.confidence_thresholds[:len(predicted_labels), None] - return predicted_labels, predicted_probas, non_confident, confidences - - def predict(self, X): - 
predicted_labels, _, non_confident, confidences = self._predict(X) predicted_labels = np.stack(predicted_labels) - predicted_labels[non_confident] = -1 - if self.transform_score: - confidences = self._transform_score(confidences) - return self._remove_first_1d(predicted_labels, confidences) + predicted_probas = np.stack(predicted_probas) + return predicted_labels, predicted_probas, non_confident, confidences def predict_proba(self, X): _, predicted_probas, non_confident, confidences = self._predict(X) - predicted_probas = np.stack(predicted_probas) predicted_probas[non_confident] = -1 - if self.transform_score: - confidences = self._transform_score(confidences) - return self._remove_first_1d(predicted_probas, confidences) + return super().predict_proba(predicted_probas, confidences) def _fit_one_interval(self, X, y, i): X_part = X[..., :self.prediction_idx[i] + 1] @@ -52,7 +42,7 @@ def _fit_one_interval(self, X, y, i): def _score(self, y, y_pred, alpha): matches = (y_pred == np.tile(y, (self.n_pred, 1))) # n_pred x n_inst - n, n_inst = matches.shape[:2] + n, n_inst, *_ = matches.shape confidences = np.ones((n, n_inst), dtype='float32') for i in range(self.n_pred): confidences[i] = self._reliabilities[i, y, y_pred[i]] diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 8eb207550..bf09acd4b 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -4,7 +4,7 @@ from fedot_ind.core.models.early_tc.base_early_tc import BaseETC from sklearn.cluster import KMeans from sklearn.metrics import confusion_matrix -from sklearn.model_selection import train_test_split, cross_val_predict +from sklearn.model_selection import cross_val_predict class EconomyK(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): @@ -14,7 +14,6 @@ def __init__(self, params: Optional[OperationParameters] = None): self.prediction_mode = params.get('prediction_mode', 
'last_available') self.lambda_ = params.get('lambda', 1.) self._cluster_factor = params.get('cluster_factor' , 1) - # self.confidence_mode = params.get('confidence_mode', 'time') # or 'confidence' self._random_state = 2104 self.__cv = 5 @@ -77,17 +76,9 @@ def _get_prediction_time(self, X, cluster_centroids, i): return time_optimal, is_optimal # n_inst def predict_proba(self, X): - probas, times, is_optimal = self._predict(X) - is_optimal = np.stack(is_optimal) + probas, times, _ = self._predict(X, training=False) probas, times = np.stack(probas), np.stack(times) - if self.transform_score: - times = self._transform_score(times) - return self._remove_first_1d(probas, times) - - def predict(self, X): - probas, times = self.predict_proba(X) - labels = probas.argmax(-1) - return self._remove_first_1d(labels, times) + return super().predict_proba(probas, times) def _transform_score(self, time): idx = self._estimator_for_predict[-1] diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 8dcb8828f..773f79d8e 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -16,20 +16,10 @@ def _init_model(self, X, y): self.probability_threshold = 1 / len(self.classes_[0]) def predict_proba(self, X): - _, predicted_probas, non_acceptance = self._predict(X) + _, predicted_probas, non_acceptance = self._predict(X, training=False) predicted_probas[non_acceptance] = 0 scores = predicted_probas.max(-1) - if self.transform_score: - scores = self._transform_score(scores) - return self._remove_first_1d(predicted_probas, scores) - - def predict(self, X): - predicted_labels, predicted_probas, non_acceptance = self._predict(X, training=False) - predicted_labels[non_acceptance] = -1 - scores = predicted_probas.max(-1) - if self.transform_score: - scores = self._transform_score(scores) - return self._remove_first_1d(predicted_labels, scores) # (prediction_points x) 
n_instances + return super().predict_proba(predicted_probas, scores) def _predict(self, X, training=True): predicted_probas, predicted_labels = super()._predict(X, training) diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 10d36e5a0..23d6c078d 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,9 +1,9 @@ from typing import Optional from fedot_ind.core.architecture.settings.computational import backend_methods as np -from sklearn.svm import OneClassSVM -from sklearn.model_selection import GridSearchCV from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from sklearn.model_selection import GridSearchCV +from sklearn.svm import OneClassSVM class TEASER(BaseETC): @@ -40,13 +40,12 @@ def _form_X_oc(self, predicted_probas): d = d.min(axis=-1).reshape(-1, 1) return np.hstack([predicted_probas, d]) - def _predict(self, X): + def _predict(self, X, training=False): estimator_indices, offset = self._select_estimators(X) X_ocs, predicted_probas, predicted_labels = zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary ) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions - to_oc_check = np.argwhere(non_acceptance) X_ocs = np.stack(X_ocs) predicted_probas = np.stack(predicted_probas) predicted_labels = np.stack(predicted_labels) @@ -56,9 +55,8 @@ def _predict(self, X): # find not accepted points X_to_ith = X_ocs[i] # if they are not outliers - final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # 1 for accept -1 for reject + final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # mark as accepted - # non_acceptance[i, np.argwhere(final_verdict >= 0).flatten()] = False final_verdicts[i] = final_verdict non_acceptance[non_acceptance & (final_verdict > 
0)] = False return predicted_labels, predicted_probas, non_acceptance, final_verdicts @@ -66,17 +64,7 @@ def _predict(self, X): def predict_proba(self, X): _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] - if self.transform_score: - final_verdicts = self._transform_score(final_verdicts) - return self._remove_first_1d(predicted_probas, final_verdicts) - - def predict(self, X): - predicted_labels, _, non_acceptance, final_verdicts = self._predict(X) - predicted_labels[non_acceptance] = -1 - # predicted_labels[non_acceptance] = final_verdicts[non_acceptance] - if self.transform_score: - final_verdicts = self._transform_score(final_verdicts) - return self._remove_first_1d(predicted_labels, final_verdicts) # (prediction_points x) n_instances + return super().predict_proba(predicted_probas, final_verdicts) def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 612d2b11b..3e1d3c4b5 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -1,23 +1,20 @@ +import copy from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel from typing import Optional, Callable, Any, List, Union from fedot.core.operations.operation_parameters import OperationParameters from fedot.core.data.data import InputData, OutputData from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE import torch.optim as optim -from torch.optim import lr_scheduler +import torch.optim.lr_scheduler as lr_scheduler import torch.nn as nn import torch.nn.functional as F import torch -from tqdm import tqdm +from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np -from 
fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array, fedot_data_type +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array import pandas as pd -from fedot.core.repository.tasks import Task, TaskTypesEnum, TsForecastingParams from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping -from fedot.core.repository.dataset_types import DataTypesEnum -from fedot_ind.core.architecture.preprocessing.data_convertor import DataConverter import torch.utils.data as data -from fedot_ind.core.architecture.settings.computational import default_device class SqueezeExciteBlock(nn.Module): def __init__(self, input_channels, filters, reduce=4): @@ -46,20 +43,22 @@ def __init__(self, input_size, input_channels, self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) self.lstm = nn.LSTM(input_size, inner_size, num_layers, batch_first=True, dropout=dropout) + + squeeze_excite_size = input_size #if not interval else interval self.conv_branch = nn.Sequential( nn.Conv1d(input_channels, inner_channels, padding='same', kernel_size=9), nn.BatchNorm1d(inner_channels), nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels), + SqueezeExciteBlock(squeeze_excite_size, inner_channels), nn.Conv1d(inner_channels, inner_channels * 2, padding='same', kernel_size=5, ), # c x l | n x c x l nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l nn.ReLU(), - SqueezeExciteBlock(input_size, inner_channels * 2), + SqueezeExciteBlock(squeeze_excite_size, inner_channels * 2), nn.Conv1d(inner_channels * 2, inner_channels, padding='same', kernel_size=3, @@ -72,103 +71,197 @@ def __init__(self, input_size, input_channels, for i in idx: torch.nn.init.kaiming_uniform_(seq[i].weight.data) - def forward(self, x, hidden_state=None, return_hidden_state=False): - # hidden_state = hidden_state or self.hidden_state - if not self.training: - print(x.shape) + def 
forward(self, x, hidden_state=None, return_hidden=False): x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size x_conv = self.conv_branch(x) # n x inner_ch x len x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) x = F.softmax(self.proj(x)) - # self.hidden_state = hidden_state - if return_hidden_state: + if return_hidden: return x, hidden_state - return x#, hidden_state - + return x + class MLSTM(BaseNeuralModel): def __init__(self, params: Optional[OperationParameters] = None): if params is None: params = {} super().__init__() - # self.num_classes = params.get('num_classes', None) - # self.epochs = params.get('epochs', 100) - # self.batch_size = params.get('batch_size', 16) - # self.activation = params.get('activation', 'ReLU') - # self.learning_rate = 0.001 - self.dropout = params.get('dropout', 0.25) self.hidden_size = params.get('hidden_size', 64) self.hidden_channels = params.get('hidden_channels', 32) self.num_layers = params.get('num_layers', 2) self.interval_percentage = params.get('interval_percentage', 10) self.min_ts_length = params.get('min_ts_length', 5) - + self.fitting_mode = params.get('fitting_mode', 'zero_padding') + self.proba_thr = params.get('proba_thr', None) + def __repr__(self): return 'MLSTM' - @convert_to_3d_torch_array - def _predict_model(self, ts: InputData, output_mode='default'): - self.model.eval() - x_test = torch.Tensor(ts).to(self._device) - pred = self.model(x_test) - return self._convert_predict(pred, output_mode) - def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) - prediction_idx = np.arange(0, n_idx, interval_length) + prediction_idx = np.arange(interval_length - 1, n_idx, interval_length) self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 - return prediction_idx + return prediction_idx, interval_length def _init_model(self, ts: 
InputData): - *_, input_channels, input_size = ts.features.shape - self.prediction_idx = self._compute_prediction_points(input_size) - self.model = MLSTM_module(input_size, input_channels, + _, input_channels, input_size = ts.features.shape + self.input_size = input_size + self.prediction_idx, self.interval = self._compute_prediction_points(input_size) + self.model = MLSTM_module(input_size if self.fitting_mode != 'moving_window' else self.interval, + input_channels, self.hidden_size, self.hidden_channels, self.num_classes, self.num_layers, self.dropout) - self.model_for_inference = MLSTM_module(input_size, input_channels, + self.model_for_inference = MLSTM_module(input_size if self.fitting_mode != 'moving_window' else self.interval, + input_channels, self.hidden_size, self.hidden_channels, self.num_classes, self.num_layers, self.dropout) optimizer = optim.Adam(self.model.parameters(), lr=0.001) - if ts.num_classes == 2: - loss_fn = CROSS_ENTROPY() - else: - loss_fn = CROSS_ENTROPY() + loss_fn = CROSS_ENTROPY() return loss_fn, optimizer - # @convert_to_3d_torch_array - # def predict(self, ts: InputData, output_mode: str = 'default'): - # return super().predict(ts, output_mode) - - # def predict_for_fit(self, ts: InputData, output_mode: str = 'default'): - # return super().predict_for_fit(ts, output_mode) - @convert_to_3d_torch_array - def _fit_model(self, ts: InputData, mode='zero_padding'): - self.epochs = 1 # !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1 + def _fit_model(self, ts: InputData): + mode = self.fitting_mode loss_fn, optimizer = self._init_model(ts) + train_loader, val_loader = self._prepare_data(ts, split_data=True, + collate_fn=getattr(self, '_augment_with_zeros')) + if mode == 'zero_padding': + super()._train_loop( + train_loader=train_loader, + val_loader=val_loader, + loss_fn=loss_fn, + optimizer=optimizer + ) + elif mode == 'moving_window': + self._train_loop( + train_loader=train_loader, + val_loader=None, + loss_fn=loss_fn, + 
optimizer=optimizer + ) + else: + raise ValueError('Unknown fitting mode') + + def _moving_window_output(self, inputs): + hidden_state = None + output = -torch.ones((inputs.shape[0], self.num_classes)) + for i in self.prediction_idx: + if i >= inputs.shape[-1]: + break + batch_interval = inputs[..., i - self.prediction_idx[0] : i + 1] + output, hidden_state = self.model(batch_interval, hidden_state, return_hidden=True) + return output - train_loader, val_loader = self._prepare_data(ts, split_data=False, - collate_fn=getattr(self, '_augment_zero_padding')) - self._train_loop( - train_loader=train_loader, - val_loader=val_loader, - loss_fn=loss_fn, - optimizer=optimizer, - ) + def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): + early_stopping = EarlyStopping() + scheduler = lr_scheduler.OneCycleLR(optimizer=optimizer, + steps_per_epoch=len(train_loader), + epochs=self.epochs, + max_lr=self.learning_rate) + if val_loader is None: + print('Not enough class samples for validation') + + best_model = None + best_val_loss = float('inf') + val_interval = self.get_validation_frequency( + self.epochs, self.learning_rate) - def _augment_zero_padding(self, batch,): - prediction_idx = self.prediction_idx - x, y = zip(*batch) - X, y = torch.stack(x), torch.stack(y) - y = np.tile(y, (len(prediction_idx), 1)) - res = [] - for i in prediction_idx: - zeroed_X = X[...] 
- zeroed_X[..., i + 1:] = 0 - res.append(zeroed_X) - res = np.concatenate(res, 0) - perm = np.random.permutation(res.shape[0]) - return torch.tensor(res[perm, ...]), torch.tensor(y[perm]) + for epoch in range(1, self.epochs + 1): + training_loss = 0.0 + valid_loss = 0.0 + self.model.train() + total = 0 + correct = 0 + for batch in tqdm(train_loader): + optimizer.zero_grad() + inputs, targets = batch + output = self._moving_window_output(inputs) + loss = loss_fn(output, targets.float()) + loss.backward() + optimizer.step() + training_loss += loss.data.item() * inputs.size(0) + total += targets.size(0) + correct += (torch.argmax(output, 1) == + torch.argmax(targets, 1)).sum().item() + + accuracy = correct / total + training_loss /= len(train_loader.dataset) + print('Epoch: {}, Accuracy = {}, Training Loss: {:.2f}'.format( + epoch, accuracy, training_loss)) + + if val_loader is not None and epoch % val_interval == 0: + self.model.eval() + total = 0 + correct = 0 + for batch in val_loader: + inputs, targets = batch + + output = self.model(inputs) + + loss = loss_fn(output, targets.float()) + + valid_loss += loss.data.item() * inputs.size(0) + total += targets.size(0) + correct += (torch.argmax(output, 1) == + torch.argmax(targets, 1)).sum().item() + if valid_loss < best_val_loss: + best_val_loss = valid_loss + best_model = copy.deepcopy(self.model) + + early_stopping(training_loss, self.model, './') + adjust_learning_rate(optimizer, scheduler, + epoch + 1, self.learning_rate, printout=False) + scheduler.step() + + if early_stopping.early_stop: + print("Early stopping") + break + + if best_model is not None: + self.model = best_model + + @convert_to_3d_torch_array + def _predict_model(self, x_test: InputData, output_mode: str = 'default'): + self.model.eval() + if self.fitting_mode == 'zero_padding': + x_test = self._padding(x_test).to(self._device) + pred = self.model(x_test) + elif self.fitting_mode == 'moving_window': + pred = 
self._moving_window_output(torch.tensor(x_test).float()) + else: + raise ValueError('Unknown prediction mode') + return self._convert_predict(pred, output_mode) + + def _padding(self, ts: np.array): + if ts.shape[-1] == self.input_size: + return torch.tensor(ts).float() + n, ch, size = ts.shape + x = torch.zeros((n, ch, self.input_size)).float() + x[..., :size] = ts + return x + + def _augment_with_zeros(self, batch: np.array): + X, y = zip(*batch) + X, y = np.stack(X), np.stack(y) + X_res, y_res = [], [] + for i in self.prediction_idx: + x = X[...] + x[..., :i + i] = 0 + X_res.append(x) + y_res.append(y) + X_res = np.concatenate(X_res) + y_res = np.concatenate(y_res) + perm = np.random.permutation(X_res.shape[0]) + return torch.tensor(X_res[perm]), torch.tensor(y_res[perm]) + + def _transform_score(self, probas): + # linear interp + thr = self.proba_thr + probas = probas - thr + positive = probas > 0 + probas[positive] *= 1 / (1 - thr) + probas[~positive] *= 1 / thr + return probas diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index 98a7e2986..cfbf25e1c 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -124,15 +124,25 @@ "min_samples_leaf": 10, "bootstrap": false }, + "ecec": { + "interval_percentage": 10, + "accuracy_importance": 0.7 + }, + "economy_k": { + "interval_percentage": 10, + "accuracy_importance": 0.7, + "cluster_factor": 1, + "lambda": 1 + }, "teaser": { "interval_percentage": 10, "consecutive_predictions": 3, - "hm_shift_to_acc": 2 + "accuracy_importance": 2 }, "proba_threshold_etc": { "interval_percentage": 10, "consecutive_predictions": 3, - "hm_shift_to_acc": 2 + "accuracy_importance": 2 }, "dt": { "max_depth": 5, diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 
42f58446a..9b624321f 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -735,10 +735,18 @@ "non_linear" ] }, - "teaser": { + "ecec": { + "meta": "sklearn_class", + "tags": [ + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" + }, + "economy_k": { "meta": "sklearn_class", "tags": [ - "simple", "interpretable", "non_lagged", "non_linear" @@ -755,6 +763,16 @@ ], "input_type": "[DataTypesEnum.table]" }, + "teaser": { + "meta": "sklearn_class", + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" + }, "xgboost": { "meta": "sklearn_class", "presets": ["*tree"], diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index c7283a1bc..c3e226dc7 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -45,8 +45,10 @@ from fedot_ind.core.models.detection.custom.stat_detector import StatisticalDetector from fedot_ind.core.models.detection.probalistic.kalman import UnscentedKalmanFilter from fedot_ind.core.models.detection.subspaces.sst import SingularSpectrumTransformation -from fedot_ind.core.models.early_tc.teaser import TEASER +from fedot_ind.core.models.early_tc.ecec import ECEC +from fedot_ind.core.models.early_tc.economy_k import EconomyK from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier +from fedot_ind.core.models.early_tc.teaser import TEASER from fedot_ind.core.models.manifold.riemann_embeding import RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR @@ -93,8 +95,10 @@ class AtomizedModel(Enum): # for detection 'one_class_svm': OneClassSVM, # Early classification + 'ecec': ECEC, + 'economy_k': 
EconomyK, + 'proba_threshold_etc': ProbabilityThresholdClassifier, 'teaser': TEASER, - 'proba_threshold_etc': ProbabilityThresholdClassifier } FEDOT_PREPROC_MODEL = { # data standartization diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 994db4e51..c19e7340e 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -65,15 +65,41 @@ 'selection_strategy': {'hyperopt-dist': hp.choice, 'sampling-scope': [['sum', 'pairwise']]} }, - 'teaser': + 'ecec': { + 'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'accuracy_importance': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[i / 10 for i in range(11)]]}, + }, + 'economy_k': { + 'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'lambda': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[1e-6, 1e-3, 1e-2, 1e-1, 1, 1e1, 1e2, 1e3, 1e4, 1e6]]}, + 'accuracy_importance': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[i / 10 for i in range(11)]]}, + }, + 'mlstm_model': { + 'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'dropout': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5]]}, + 'hidden_size': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(10, 101, 10))]}, + 'num_layers': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(1, 6))]}, + 'hidden_channels': {'hyperopt-dist': hp.choice, + 'sampling-scope': [8, 16, 32, 64, 96]}, + }, + 'proba_threshold_etc': {'interval_percentage': {'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, - 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, + 'accuracy_importance': {'hyperopt-dist': hp.choice, 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, }, - 'proba_threshold_etc': + 'teaser': {'interval_percentage': 
{'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, From 926eb927102b068b2710858351bce05868f300ba Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 15:02:54 +0300 Subject: [PATCH 29/43] slight fixes --- fedot_ind/core/models/early_tc/base_early_tc.py | 2 +- fedot_ind/core/models/early_tc/economy_k.py | 9 ++++++--- .../core/repository/data/default_operation_params.json | 4 ++-- fedot_ind/core/tuning/search_space.py | 6 +++--- 4 files changed, 12 insertions(+), 9 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 9fbc162c5..cbed8c463 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -124,7 +124,7 @@ def _score(self, X, y, accuracy_importance=None, training=True): predictions = self._predict(X, training)[0] prediction_points = predictions.shape[0] accuracies = (predictions == np.tile(y, (prediction_points, 1))).sum(axis=1) / len(y) - return (1 + accuracy_importance) * accuracies * self.earliness[:prediction_points] / (accuracy_importance * accuracies + self.earliness[:prediction_points]) + return (1 - accuracy_importance) * self.earliness[:prediction_points] + accuracy_importance * accuracies def _get_applicable_index(self, last_available_idx): idx = np.searchsorted(self.prediction_idx, last_available_idx, side='right') diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index bf09acd4b..c39097189 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -65,7 +65,7 @@ def __expected_costs(self, X, cluster_centroids, i): np.sum(self.state[i:], axis=-1), axes=(0, 2, 1) ) * self._pyck_[None, ...], axis=1) costs = cluster_probas @ s_glob.T # n_inst x time_left - costs += self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? 
+ costs -= self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? return costs def _get_prediction_time(self, X, cluster_centroids, i): @@ -82,8 +82,11 @@ def predict_proba(self, X): def _transform_score(self, time): idx = self._estimator_for_predict[-1] - scores = -(1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) - scores[scores == 0] = 1 # no posibility for lininterp when sure + scores = (1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) # [1 / n; 1 ] - 1 / n) * n /(n - 1) * 2 - 1 + n = self.n_pred + scores -= 1 / n + scores *= n / (n - 1) * 2 + scores -= 1 return scores diff --git a/fedot_ind/core/repository/data/default_operation_params.json b/fedot_ind/core/repository/data/default_operation_params.json index cfbf25e1c..a91a8a938 100644 --- a/fedot_ind/core/repository/data/default_operation_params.json +++ b/fedot_ind/core/repository/data/default_operation_params.json @@ -137,12 +137,12 @@ "teaser": { "interval_percentage": 10, "consecutive_predictions": 3, - "accuracy_importance": 2 + "accuracy_importance": 0.5 }, "proba_threshold_etc": { "interval_percentage": 10, "consecutive_predictions": 3, - "accuracy_importance": 2 + "accuracy_importance": 0.5 }, "dt": { "max_depth": 5, diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index c19e7340e..832eaad26 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -97,15 +97,15 @@ 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, 'accuracy_importance': {'hyperopt-dist': hp.choice, - 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, }, 'teaser': {'interval_percentage': {'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, - 'hm_shift_to_acc': {'hyperopt-dist': 
hp.choice, - 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + 'accuracy_importance': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, }, 'deepar_model': {'epochs': {'hyperopt-dist': hp.choice, From 49d0570330408700a89905475c03a71293cb4f3a Mon Sep 17 00:00:00 2001 From: leostre Date: Mon, 15 Jul 2024 12:30:35 +0300 Subject: [PATCH 30/43] refactored train loop + microfixes --- .../core/metrics/metrics_implementation.py | 122 +++++++++++++++++- fedot_ind/core/models/early_tc/ecec.py | 6 +- fedot_ind/core/models/early_tc/economy_k.py | 3 +- .../core/models/early_tc/prob_threshold.py | 3 +- fedot_ind/core/models/early_tc/teaser.py | 5 +- .../models/nn/network_impl/base_nn_model.py | 117 ++++++++++------- .../core/models/nn/network_impl/mlstm.py | 97 +++++--------- 7 files changed, 227 insertions(+), 126 deletions(-) diff --git a/fedot_ind/core/metrics/metrics_implementation.py b/fedot_ind/core/metrics/metrics_implementation.py index fea9c2877..8803f18dd 100644 --- a/fedot_ind/core/metrics/metrics_implementation.py +++ b/fedot_ind/core/metrics/metrics_implementation.py @@ -1,6 +1,7 @@ from typing import Optional from typing import Union +import matplotlib.pyplot as plt import numpy as np import pandas as pd from fedot.core.data.data import InputData @@ -220,6 +221,9 @@ def smape(a, f, _=None): return 1 / len(a) * np.sum(2 * np.abs(f - a) / (np.abs(a) + np.abs(f)) * 100) +def rmse(y_true, y_pred): + return np.sqrt(mean_squared_error(y_true, y_pred)) + def mape(A, F): return mean_absolute_percentage_error(A, F) @@ -232,9 +236,6 @@ def calculate_regression_metric(target, **kwargs): target = target.astype(float) - def rmse(y_true, y_pred): - return np.sqrt(mean_squared_error(y_true, y_pred)) - metric_dict = {'r2': r2_score, 'mse': mean_squared_error, 'rmse': rmse, @@ -261,9 +262,6 @@ def calculate_forecasting_metric(target, **kwargs): target = target.astype(float) - def rmse(y_true, y_pred): - return 
np.sqrt(mean_squared_error(y_true, y_pred)) - metric_dict = { 'rmse': rmse, 'mae': mean_absolute_error, @@ -345,10 +343,95 @@ def kl_divergence(solution: pd.DataFrame, return np.average(solution.sum(axis=1), weights=sample_weights) else: return np.average(solution.mean()) + +class ETSCPareto(QualityMetric, ParetoMetrics): + def __init__(self, + target, + predicted_labels, + predicted_probs=None, + weigths: tuple = None, + mode: str = 'robust', + reduce: bool = True, + metric_list: tuple = ( + 'f1', 'roc_auc', 'accuracy', 'logloss', 'precision'), + default_value: float = 0.0): + self.target = target.flatten() + self.predicted_labels = predicted_labels + self.predicted_probs = predicted_probs + self.metric_list = metric_list + self.default_value = default_value + self.weights = weigths + self.mode = mode + self.columns = ['robustness'] if self.mode == 'robust' else [] + self.columns.extend(metric_list) + self.reduce = reduce + def metric(self) -> float: + if len(self.predicted_labels.shape) == 1: + self.predicted_labels = self.predicted_labels[None, ...] + self.predicted_probs = self.predicted_probs[None, ...] 
+ + n_metrics = len(self.metric_list) + (self.mode == 'robust') + n_est = self.predicted_labels.shape[0] + result = np.zeros((n_est, n_metrics)) + if self.mode == 'robust': + mask = self.predicted_probs >= 0 + if not mask.any(): + return result + robustness = mask.sum(-1) / self.predicted_probs.shape[-1] + result[:, 0] = robustness.flatten() + else: + mask = np.ones_like(self.predicted_probs, dtype=bool) + + for est in range(n_est): + for i, metric in enumerate(self.metric_list, 1): + assert metric in CLASSIFICATION_METRIC_DICT, f'{metric} is not found in available metrics' + metric_value = CLASSIFICATION_METRIC_DICT[metric](self.target[mask[est]], + self.predicted_labels[est][mask[est]]) + result[est, i] = metric_value + + if self.weights is None: + if self.reduce: + self.weights = np.empty(n_metrics) + self.weights.fill(1 / len(self.weights)) + else: + self.weights = np.eye(n_metrics) + else: + assert self.weights.shape[-1] == self.metrics.shape[-1], 'Metrics and weights size mismatch!' 
+ self.weights /= self.weights.sum() + + result = result @ self.weights.T + if not self.reduce: + return pd.DataFrame(result, columns=self.columns) + else: + return result + + def plot_bicrit_metric(self, metrics, select=None, metrics_names=None): + if not metrics_names: + metrics_names = ('Robustness', 'Accuracy') + plt.figure(figsize=(10, 10)) + assert metrics.shape[-1] == 2, 'only 2 metrics can be plotted' + for i, metric in enumerate(metrics): + selection = metric[select] + sizes = ((np.arange(selection.shape[0]) * 2)[::-1]) ** 1.5 + 10 + plt.scatter(*(metric[select]).T, + s=sizes, + label=i) + plt.legend(loc="upper right", bbox_to_anchor=(1.5, 1)) + plt.ylabel(metrics_names[1]) + plt.xlabel(metrics_names[0]) + plt.xlim((-0.05, 1.05)) + plt.ylim((-0.05, 1.05)) + plt.xticks(np.linspace(0, 1, 11)) + plt.yticks(np.linspace(0, 1, 11)) + plt.grid(True) + + def select_pareto_front(self, metrics, maximize=True): + pareto_mask = self.pareto_metric_list(metrics, maximise=maximize) + return metrics[pareto_mask] -class AnomalyMetric(QualityMetric): +class AnomalyMetric(QualityMetric): def __init__(self, target, predicted_labels, @@ -617,3 +700,28 @@ def calculate_detection_metric( target=target, predicted_labels=labels).metric() return metric_dict + +REGRESSION_METRIC_DICT = {'r2': r2_score, + 'mse': mean_squared_error, + 'rmse': rmse, + 'mae': mean_absolute_error, + 'msle': mean_squared_log_error, + 'mape': mean_absolute_percentage_error, + 'median_absolute_error': median_absolute_error, + 'explained_variance_score': explained_variance_score, + 'max_error': max_error, + 'd2_absolute_error_score': d2_absolute_error_score} + +CLASSIFICATION_METRIC_DICT = {'accuracy': accuracy_score, + 'f1': f1_score, + 'roc_auc': roc_auc_score, + 'precision': precision_score, + 'logloss': log_loss} + +FORECASTING_METRICS_DICT = { + 'rmse': rmse, + 'mae': mean_absolute_error, + 'median_absolute_error': median_absolute_error, + 'smape': smape, + 'mase': mase + } diff --git 
a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index f6e163d25..792810ce6 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -1,9 +1,11 @@ from typing import Optional -from fedot_ind.core.architecture.settings.computational import backend_methods as np + from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.models.early_tc.base_early_tc import BaseETC -from sklearn.model_selection import cross_val_predict from sklearn.metrics import confusion_matrix +from sklearn.model_selection import cross_val_predict + class ECEC(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index c39097189..fae2f409b 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -1,6 +1,7 @@ from typing import Optional -from fedot_ind.core.architecture.settings.computational import backend_methods as np + from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.models.early_tc.base_early_tc import BaseETC from sklearn.cluster import KMeans from sklearn.metrics import confusion_matrix diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 773f79d8e..fd1455a36 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -1,6 +1,7 @@ from typing import Optional -from fedot_ind.core.architecture.settings.computational import backend_methods as np + from fedot.core.operations.operation_parameters import OperationParameters +from 
fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.models.early_tc.base_early_tc import BaseETC class ProbabilityThresholdClassifier(BaseETC): diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 23d6c078d..2dc905508 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -1,6 +1,7 @@ from typing import Optional -from fedot_ind.core.architecture.settings.computational import backend_methods as np + from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.models.early_tc.base_early_tc import BaseETC from sklearn.model_selection import GridSearchCV from sklearn.svm import OneClassSVM @@ -43,7 +44,7 @@ def _form_X_oc(self, predicted_probas): def _predict(self, X, training=False): estimator_indices, offset = self._select_estimators(X) X_ocs, predicted_probas, predicted_labels = zip( - *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary + *[self._predict_one_slave(X, i, offset) for i in estimator_indices] ) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions X_ocs = np.stack(X_ocs) diff --git a/fedot_ind/core/models/nn/network_impl/base_nn_model.py b/fedot_ind/core/models/nn/network_impl/base_nn_model.py index e9d6c7274..f285853d0 100644 --- a/fedot_ind/core/models/nn/network_impl/base_nn_model.py +++ b/fedot_ind/core/models/nn/network_impl/base_nn_model.py @@ -113,6 +113,69 @@ def _prepare_data(self, ts, split_data: bool = True, collate_fn=None): self.label_encoder = train_dataset.label_encoder return train_loader, val_loader + def _train_one_batch(self, batch, optimizer, loss_fn): + optimizer.zero_grad() + inputs, targets = batch + output = self.model(inputs) + loss = loss_fn(output, targets.float()) + loss.backward() + 
optimizer.step() + training_loss = loss.data.item() * inputs.size(0) + total = targets.size(0) + correct = (torch.argmax(output, 1) == + torch.argmax(targets, 1)).sum().item() + return training_loss, total, correct + + def _eval_one_batch(self, batch, loss_fn): + inputs, targets = batch + output = self.model(inputs) + loss = loss_fn(output, targets.float()) + valid_loss = loss.data.item() * inputs.size(0) + total = targets.size(0) + correct = (torch.argmax(output, 1) == + torch.argmax(targets, 1)).sum().item() + return valid_loss, total, correct + + def _run_one_epoch(self, train_loader, val_loader, + optimizer, loss_fn, + epoch, val_interval, + early_stopping, scheduler, + best_val_loss): + training_loss = 0.0 + valid_loss = 0.0 + self.model.train() + total = 0 + correct = 0 + best_model = self.model + for batch in tqdm(train_loader): + training_loss_batch, total_batch, correct_batch = self._train_one_batch(batch, optimizer, loss_fn) + training_loss += training_loss_batch + total += total_batch + correct += correct_batch + accuracy = correct / total + training_loss /= len(train_loader.dataset) + print('Epoch: {}, Accuracy = {}, Training Loss: {:.2f}'.format( + epoch, accuracy, training_loss)) + + if val_loader is not None and epoch % val_interval == 0: + self.model.eval() + total = 0 + correct = 0 + for batch in val_loader: + valid_loss_batch, total_batch, correct_batch = self._eval_one_batch(batch, loss_fn) + valid_loss += valid_loss_batch + total += total_batch + correct += correct_batch + if valid_loss < best_val_loss: + best_val_loss = valid_loss + best_model = copy.deepcopy(self.model) + + early_stopping(training_loss, self.model, './') + adjust_learning_rate(optimizer, scheduler, + epoch + 1, self.learning_rate, printout=False) + scheduler.step() + return best_model, best_val_loss + def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): early_stopping = EarlyStopping() scheduler = lr_scheduler.OneCycleLR(optimizer=optimizer, @@ -127,53 +190,13 
@@ def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): self.epochs, self.learning_rate) loss_prefix = 'RMSE' if self.is_regression_task else 'Accuracy' for epoch in range(1, self.epochs + 1): - training_loss = 0.0 - valid_loss = 0.0 - self.model.train() - total = 0 - correct = 0 - for batch in tqdm(train_loader): - optimizer.zero_grad() - inputs, targets = batch - output = self.model(inputs) - loss = loss_fn(output, targets.float()) - loss.backward() - optimizer.step() - training_loss += loss.data.item() / inputs.size(0) if self.is_regression_task \ - else loss.data.item() * inputs.size(0) - total += targets.size(0) - correct += (torch.argmax(output, 1) == torch.argmax(targets, 1)).sum().item() \ - if not self.is_regression_task else 0 - - training_loss = training_loss / len(train_loader.dataset) if not self.is_regression_task else training_loss - accuracy = correct / total if not self.is_regression_task else training_loss - print('Epoch: {}, {}= {}, Training Loss: {:.2f}'.format( - epoch, loss_prefix, accuracy, training_loss)) - - if val_loader is not None and epoch % val_interval == 0: - self.model.eval() - total = 0 - correct = 0 - for batch in val_loader: - inputs, targets = batch - output = self.model(inputs) - - loss = loss_fn(output, targets.float()) - - valid_loss += loss.data.item() / inputs.size(0) if self.is_regression_task \ - else loss.data.item() * inputs.size(0) - total += targets.size(0) - correct += (torch.argmax(output, 1) == torch.argmax(targets, 1)).sum().item() \ - if not self.is_regression_task else 0 - if valid_loss < best_val_loss: - best_val_loss = valid_loss - best_model = copy.deepcopy(self.model) - - early_stopping(training_loss, self.model, './') - adjust_learning_rate(optimizer, scheduler, - epoch + 1, self.learning_rate, printout=False) - scheduler.step() - + best_model, best_val_loss = self._run_one_epoch( + train_loader, val_loader, + optimizer, loss_fn, + epoch, val_interval, + early_stopping, scheduler, + 
best_val_loss + ) if early_stopping.early_stop: print("Early stopping") break diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 3e1d3c4b5..604f28660 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -154,74 +154,39 @@ def _moving_window_output(self, inputs): batch_interval = inputs[..., i - self.prediction_idx[0] : i + 1] output, hidden_state = self.model(batch_interval, hidden_state, return_hidden=True) return output - - def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): - early_stopping = EarlyStopping() - scheduler = lr_scheduler.OneCycleLR(optimizer=optimizer, - steps_per_epoch=len(train_loader), - epochs=self.epochs, - max_lr=self.learning_rate) - if val_loader is None: - print('Not enough class samples for validation') - - best_model = None - best_val_loss = float('inf') - val_interval = self.get_validation_frequency( - self.epochs, self.learning_rate) - - for epoch in range(1, self.epochs + 1): - training_loss = 0.0 - valid_loss = 0.0 - self.model.train() - total = 0 - correct = 0 - for batch in tqdm(train_loader): - optimizer.zero_grad() - inputs, targets = batch - output = self._moving_window_output(inputs) - loss = loss_fn(output, targets.float()) - loss.backward() - optimizer.step() - training_loss += loss.data.item() * inputs.size(0) - total += targets.size(0) - correct += (torch.argmax(output, 1) == + + def _train_one_batch(self, batch, optimizer, loss_fn): + if self.fitting_mode == 'zero_padding': + return super()._train_one_batch(batch, optimizer, loss_fn) + elif self.fitting_mode == 'moving_window': + optimizer.zero_grad() + inputs, targets = batch + output = self._moving_window_output(inputs) + loss = loss_fn(output, targets.float()) + loss.backward() + optimizer.step() + training_loss = loss.data.item() * inputs.size(0) + total = targets.size(0) + correct = (torch.argmax(output, 1) == 
torch.argmax(targets, 1)).sum().item() - - accuracy = correct / total - training_loss /= len(train_loader.dataset) - print('Epoch: {}, Accuracy = {}, Training Loss: {:.2f}'.format( - epoch, accuracy, training_loss)) - - if val_loader is not None and epoch % val_interval == 0: - self.model.eval() - total = 0 - correct = 0 - for batch in val_loader: - inputs, targets = batch - - output = self.model(inputs) - - loss = loss_fn(output, targets.float()) - - valid_loss += loss.data.item() * inputs.size(0) - total += targets.size(0) - correct += (torch.argmax(output, 1) == + return training_loss, total, correct + else: + raise ValueError('Unknown fitting mode!') + + def _eval_one_batch(self, batch, loss_fn): + if self.fitting_mode == 'zero_padding': + return super()._eval_one_batch(batch, loss_fn) + elif self.fitting_mode == 'moving_window': + inputs, targets = batch + output = self._moving_window_output(inputs) + loss = loss_fn(output, targets.float()) + valid_loss = loss.data.item() * inputs.size(0) + total = targets.size(0) + correct = (torch.argmax(output, 1) == torch.argmax(targets, 1)).sum().item() - if valid_loss < best_val_loss: - best_val_loss = valid_loss - best_model = copy.deepcopy(self.model) - - early_stopping(training_loss, self.model, './') - adjust_learning_rate(optimizer, scheduler, - epoch + 1, self.learning_rate, printout=False) - scheduler.step() - - if early_stopping.early_stop: - print("Early stopping") - break - - if best_model is not None: - self.model = best_model + return valid_loss, total, correct + else: + raise ValueError('Unknown fitting mode!') @convert_to_3d_torch_array def _predict_model(self, x_test: InputData, output_mode: str = 'default'): From 2e2ad91d0b3ed6e23cab0a8ca2e801c25f5fdd7b Mon Sep 17 00:00:00 2001 From: leostre Date: Wed, 17 Jul 2024 02:33:53 +0300 Subject: [PATCH 31/43] to pull req --- fedot_ind/core/models/early_tc/base_early_tc.py | 4 ++-- fedot_ind/core/models/early_tc/ecec.py | 3 --- 
fedot_ind/core/models/early_tc/economy_k.py | 1 - fedot_ind/core/models/early_tc/prob_threshold.py | 2 -- fedot_ind/core/models/early_tc/teaser.py | 7 ++----- 5 files changed, 4 insertions(+), 13 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index cbed8c463..9c8e12cb8 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -85,9 +85,9 @@ def _predict(self, X, training=True): estimator_indices, offset = self._select_estimators(X, training) if not training: self._estimator_for_predict = estimator_indices - prediction = zip( + prediction = (np.stack(array_list) for array_list in zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary - ) + )) return prediction # see the output in _predict_one_slave def _consecutive_count(self, predicted_labels: List[np.array]): diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index 792810ce6..576b3a4ba 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -23,11 +23,8 @@ def _predict_one_slave(self, X, i, offset=0): def _predict(self, X, training=False): predicted_labels, predicted_probas, reliabilities = super()._predict(X, training) - reliabilities = np.stack(reliabilities) confidences = 1 - np.cumprod(1 - reliabilities, axis=0) non_confident = confidences < self.confidence_thresholds[:len(predicted_labels), None] - predicted_labels = np.stack(predicted_labels) - predicted_probas = np.stack(predicted_probas) return predicted_labels, predicted_probas, non_confident, confidences def predict_proba(self, X): diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index fae2f409b..481cad97b 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -78,7 +78,6 @@ def 
_get_prediction_time(self, X, cluster_centroids, i): def predict_proba(self, X): probas, times, _ = self._predict(X, training=False) - probas, times = np.stack(probas), np.stack(times) return super().predict_proba(probas, times) def _transform_score(self, time): diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index fd1455a36..b72a927f1 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -24,8 +24,6 @@ def predict_proba(self, X): def _predict(self, X, training=True): predicted_probas, predicted_labels = super()._predict(X, training) - predicted_probas = np.stack(predicted_probas) - predicted_labels = np.stack(predicted_labels) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions double_check = predicted_probas.max(axis=-1) > self.probability_threshold non_acceptance[non_acceptance & double_check] = False diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 2dc905508..0350d0886 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -43,13 +43,10 @@ def _form_X_oc(self, predicted_probas): def _predict(self, X, training=False): estimator_indices, offset = self._select_estimators(X) - X_ocs, predicted_probas, predicted_labels = zip( + X_ocs, predicted_probas, predicted_labels = map(np.stack, zip( *[self._predict_one_slave(X, i, offset) for i in estimator_indices] - ) + )) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions - X_ocs = np.stack(X_ocs) - predicted_probas = np.stack(predicted_probas) - predicted_labels = np.stack(predicted_labels) final_verdicts = np.zeros((len(estimator_indices), X.shape[0])) # for each point of estimation for i in range(predicted_labels.shape[0]): From fa802695e1d1b855f468844d5301a0ec7b21ced7 Mon Sep 17 00:00:00 2001 From: autopep8 bot 
Date: Tue, 16 Jul 2024 23:52:38 +0000 Subject: [PATCH 32/43] Automated autopep8 fixes --- fedot_ind/core/metrics/interval_metrics.py | 62 +++++----- .../core/metrics/metrics_implementation.py | 55 ++++----- .../core/models/early_tc/base_early_tc.py | 36 +++--- fedot_ind/core/models/early_tc/ecec.py | 29 +++-- fedot_ind/core/models/early_tc/economy_k.py | 50 ++++---- fedot_ind/core/models/early_tc/metrics.py | 62 +++++----- .../core/models/early_tc/prob_threshold.py | 9 +- fedot_ind/core/models/early_tc/teaser.py | 32 +++--- .../models/nn/network_impl/base_nn_model.py | 12 +- .../core/models/nn/network_impl/mlstm.py | 108 +++++++++--------- fedot_ind/core/tuning/search_space.py | 50 ++++---- tests/unit/core/models/test_teaser.py | 5 +- 12 files changed, 262 insertions(+), 248 deletions(-) diff --git a/fedot_ind/core/metrics/interval_metrics.py b/fedot_ind/core/metrics/interval_metrics.py index f4a5f6544..f95586147 100644 --- a/fedot_ind/core/metrics/interval_metrics.py +++ b/fedot_ind/core/metrics/interval_metrics.py @@ -1,17 +1,18 @@ from sklearn.metrics import confusion_matrix import numpy as np -import pandas as pd -from fedot.core.data.data import InputData, OutputData -from typing import Tuple, List, Optional, Union, Literal +import pandas as pd +from typing import Union, Literal + def conf_matrix(actual, predicted): cm = confusion_matrix(actual, predicted) return dict(TN=cm[0, 0], FP=cm[0, 1], FN=cm[1, 0], TP=[1, 1]) + def average_delay(boundaries, prediction, - point, - use_idx=True, - window_placement='lefter'): + point, + use_idx=True, + window_placement='lefter'): cp_confusion = extract_cp_cm(boundaries, prediction, use_idx=use_idx, use_switch_point=False) # statistics statistics = { @@ -29,14 +30,16 @@ def average_delay(boundaries, prediction, i: time_func(triplet) for i, triplet in cp_confusion['TPs'].items() } return detection_history, statistics - + + def tp_transform(tps): return np.diff(tps[[1, 0]], axis=0) / np.diff(tps[[-1, 0]], axis=0) + def 
extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], - prediction: pd.DataFrame, - use_switch_point: bool = True, # if first anomaly dot is considered as changepoint - use_idx: bool = False): + prediction: pd.DataFrame, + use_switch_point: bool = True, # if first anomaly dot is considered as changepoint + use_idx: bool = False): if isinstance(boundaries, pd.DataFrame): boundaries = boundaries.values.T anomaly_tsp = prediction[prediction == 1].sort_index().index @@ -44,18 +47,18 @@ def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], if boundaries.shape[1]: - FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest + FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest for i, (b_low, b_up) in enumerate(boundaries): all_tsp_in_window = prediction[b_low: b_up].index anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp - if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? + if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? 
FNs.append(i if use_idx else all_tsp_in_window) - TPs[i] = [b_low, - anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, + TPs[i] = [b_low, + anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, b_up] if not use_idx: FNs.append(all_tsp_in_window - anomaly_tsp_in_window) - FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest + FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest else: FPs.append(anomaly_tsp) @@ -69,9 +72,11 @@ def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], ) # cognate of single_detecting_boundaries -def get_boundaries(idx, actual_timestamps, window_size:int = None, - window_placement: Literal['left', 'right', 'central'] = 'left', - intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', + + +def get_boundaries(idx, actual_timestamps, window_size: int = None, + window_placement: Literal['left', 'right', 'central'] = 'left', + intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', ): # idx = idx # cast everything to pandas object fir the subsequent comfort @@ -82,30 +87,30 @@ def get_boundaries(idx, actual_timestamps, window_size:int = None, else: idx = pd.Series(idx) td = window_size - else: + else: raise TypeError('Unexpected type of ts index') - + boundaries = np.tile(actual_timestamps, (2, 1)) - # [0, ...] - lower bound, [1, ...] - upper + # [0, ...] - lower bound, [1, ...] 
- upper if window_placement == 'left': boundaries[0] -= td elif window_placement == 'central': boundaries[0] -= td / 2 boundaries[1] += td / 2 elif window_placement == 'right': - boundaries[1] += td + boundaries[1] += td else: raise ValueError('Unknown mode') - + if not len(actual_timestamps): return boundaries - # intersection resolution + # intersection resolution for i in range(len(actual_timestamps) - 1): if not boundaries[0, i + 1] > boundaries[1, i]: continue - if intersection_mode == 'shift_to_left': + if intersection_mode == 'shift_to_left': boundaries[0, i + 1] = boundaries[1, i] elif intersection_mode == 'shift_to_right': boundaries[1, i] = boundaries[0, i + 1] @@ -120,6 +125,7 @@ def get_boundaries(idx, actual_timestamps, window_size:int = None, boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) return boundaries + def nab(boundaries, predictions, mode='standard', custom_coefs=None): inner_coefs = { 'low_FP': [1.0, -0.11, -1.0], @@ -128,11 +134,9 @@ def nab(boundaries, predictions, mode='standard', custom_coefs=None): } coefs = custom_coefs or inner_coefs[mode] confusion_matrix = extract_cp_cm(boundaries, predictions) - + tps = confusion_matrix['tps'] - score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], + score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], coefs) return score - - diff --git a/fedot_ind/core/metrics/metrics_implementation.py b/fedot_ind/core/metrics/metrics_implementation.py index 8803f18dd..e419023ef 100644 --- a/fedot_ind/core/metrics/metrics_implementation.py +++ b/fedot_ind/core/metrics/metrics_implementation.py @@ -221,6 +221,7 @@ def smape(a, f, _=None): return 1 / len(a) * np.sum(2 * np.abs(f - a) / (np.abs(a) + np.abs(f)) * 100) + def rmse(y_true, y_pred): return np.sqrt(mean_squared_error(y_true, y_pred)) @@ -343,7 +344,8 @@ def kl_divergence(solution: pd.DataFrame, return np.average(solution.sum(axis=1), weights=sample_weights) else: return 
np.average(solution.mean()) - + + class ETSCPareto(QualityMetric, ParetoMetrics): def __init__(self, target, @@ -387,7 +389,7 @@ def metric(self) -> float: for i, metric in enumerate(self.metric_list, 1): assert metric in CLASSIFICATION_METRIC_DICT, f'{metric} is not found in available metrics' metric_value = CLASSIFICATION_METRIC_DICT[metric](self.target[mask[est]], - self.predicted_labels[est][mask[est]]) + self.predicted_labels[est][mask[est]]) result[est, i] = metric_value if self.weights is None: @@ -399,13 +401,13 @@ def metric(self) -> float: else: assert self.weights.shape[-1] == self.metrics.shape[-1], 'Metrics and weights size mismatch!' self.weights /= self.weights.sum() - + result = result @ self.weights.T if not self.reduce: return pd.DataFrame(result, columns=self.columns) else: return result - + def plot_bicrit_metric(self, metrics, select=None, metrics_names=None): if not metrics_names: metrics_names = ('Robustness', 'Accuracy') @@ -414,8 +416,8 @@ def plot_bicrit_metric(self, metrics, select=None, metrics_names=None): for i, metric in enumerate(metrics): selection = metric[select] sizes = ((np.arange(selection.shape[0]) * 2)[::-1]) ** 1.5 + 10 - plt.scatter(*(metric[select]).T, - s=sizes, + plt.scatter(*(metric[select]).T, + s=sizes, label=i) plt.legend(loc="upper right", bbox_to_anchor=(1.5, 1)) plt.ylabel(metrics_names[1]) @@ -425,7 +427,7 @@ def plot_bicrit_metric(self, metrics, select=None, metrics_names=None): plt.xticks(np.linspace(0, 1, 11)) plt.yticks(np.linspace(0, 1, 11)) plt.grid(True) - + def select_pareto_front(self, metrics, maximize=True): pareto_mask = self.pareto_metric_list(metrics, maximise=maximize) return metrics[pareto_mask] @@ -701,27 +703,28 @@ def calculate_detection_metric( predicted_labels=labels).metric() return metric_dict + REGRESSION_METRIC_DICT = {'r2': r2_score, - 'mse': mean_squared_error, - 'rmse': rmse, - 'mae': mean_absolute_error, - 'msle': mean_squared_log_error, - 'mape': mean_absolute_percentage_error, - 
'median_absolute_error': median_absolute_error, - 'explained_variance_score': explained_variance_score, - 'max_error': max_error, - 'd2_absolute_error_score': d2_absolute_error_score} + 'mse': mean_squared_error, + 'rmse': rmse, + 'mae': mean_absolute_error, + 'msle': mean_squared_log_error, + 'mape': mean_absolute_percentage_error, + 'median_absolute_error': median_absolute_error, + 'explained_variance_score': explained_variance_score, + 'max_error': max_error, + 'd2_absolute_error_score': d2_absolute_error_score} CLASSIFICATION_METRIC_DICT = {'accuracy': accuracy_score, - 'f1': f1_score, - 'roc_auc': roc_auc_score, - 'precision': precision_score, - 'logloss': log_loss} + 'f1': f1_score, + 'roc_auc': roc_auc_score, + 'precision': precision_score, + 'logloss': log_loss} FORECASTING_METRICS_DICT = { - 'rmse': rmse, - 'mae': mean_absolute_error, - 'median_absolute_error': median_absolute_error, - 'smape': smape, - 'mase': mase - } + 'rmse': rmse, + 'mae': mean_absolute_error, + 'median_absolute_error': median_absolute_error, + 'smape': smape, + 'mase': mase +} diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 9c8e12cb8..f49a98127 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -7,9 +7,9 @@ class BaseETC(ClassifierMixin, BaseEstimator): - def __init__(self, params: Optional[OperationParameters] = None): + def __init__(self, params: Optional[OperationParameters] = None): if params is None: - params = {} + params = {} super().__init__() self.interval_percentage = params.get('interval_percentage', 10) self.consecutive_predictions = params.get('consecutive_predictions', 1) @@ -26,7 +26,9 @@ def _init_model(self, X, y): max_data_length = X.shape[-1] self.prediction_idx = self._compute_prediction_points(max_data_length) self.n_pred = len(self.prediction_idx) - self.slave_estimators = [WEASEL(random_state=self.random_state, 
support_probabilities=True, **self.weasel_params) for _ in range(self.n_pred)] + self.slave_estimators = [ + WEASEL(random_state=self.random_state, support_probabilities=True, **self.weasel_params) + for _ in range(self.n_pred)] self.scalers = [StandardScaler() for _ in range(self.n_pred)] self._chosen_estimator_idx = -1 self.classes_ = [np.unique(y)] @@ -37,7 +39,7 @@ def required_length(self): if not hasattr(self, '_chosen_estimator_idx'): return None return self.prediction_idx[self._chosen_estimator_idx] - + @property def n_classes(self): return len(self.classes_[0]) @@ -50,23 +52,23 @@ def fit(self, X, y=None): self._fit_one_interval(X, y, i) def _fit_one_interval(self, X, y, i): - X_part = X[..., :self.prediction_idx[i] + 1] + X_part = X[..., :self.prediction_idx[i] + 1] X_part = self.scalers[i].fit_transform(X_part) probas = self.slave_estimators[i].fit_predict_proba(X_part, y) return probas def _predict_one_slave(self, X, i, offset=0): - X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] + X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] X_part = self.scalers[i].transform(X_part) probas = self.slave_estimators[i].predict_proba(X_part) - return probas, np.argmax(probas, axis=-1) - + return probas, np.argmax(probas, axis=-1) + def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) prediction_idx = np.arange(n_idx - 1, -1, -interval_length)[::-1][1:] - self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 return prediction_idx - + def _select_estimators(self, X, training=False): offset = 0 if not training and self.prediction_mode == 'best_by_harmonic_mean': @@ -80,15 +82,15 @@ def _select_estimators(self, X, training=False): else: raise ValueError('Unknown prediction mode') return estimator_indices, offset - + def 
_predict(self, X, training=True): estimator_indices, offset = self._select_estimators(X, training) if not training: self._estimator_for_predict = estimator_indices prediction = (np.stack(array_list) for array_list in zip( - *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary + *[self._predict_one_slave(X, i, offset) for i in estimator_indices] # check boundary )) - return prediction # see the output in _predict_one_slave + return prediction # see the output in _predict_one_slave def _consecutive_count(self, predicted_labels: List[np.array]): n = len(predicted_labels[0]) @@ -97,10 +99,10 @@ def _consecutive_count(self, predicted_labels: List[np.array]): for i in range(1, prediction_points): equal = predicted_labels[i - 1] == predicted_labels[i] consecutive_labels[i, equal] = consecutive_labels[i - 1, equal] + 1 - return consecutive_labels # prediction_points x n_instances - + return consecutive_labels # prediction_points x n_instances + def predict_proba(self, *args): - predicted_probas, scores, *_ = args + predicted_probas, scores, *_ = args if self.transform_score: scores = self._transform_score(scores) scores = np.tile(scores[..., None], (1, 1, self.n_classes)) @@ -108,7 +110,7 @@ def predict_proba(self, *args): if prediction.shape[1] == 1: prediction = prediction.squeeze(1) return prediction - + def predict(self, X): prediction = self.predict_proba(X) labels = prediction[0:1].argmax(-1) diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index 576b3a4ba..b210d6cfa 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -11,27 +11,27 @@ class ECEC(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): super().__init__(params) self.__cv = 5 - + def _init_model(self, X, y): super()._init_model(X, y) self._reliabilities = np.zeros((self.n_pred, self.n_classes, self.n_classes)) def _predict_one_slave(self, X, i, offset=0): - 
predicted_probas, predicted_labels = super()._predict_one_slave(X, i, offset) - reliabilities = self._reliabilities[i, predicted_labels, predicted_labels].flatten() # n_inst + predicted_probas, predicted_labels = super()._predict_one_slave(X, i, offset) + reliabilities = self._reliabilities[i, predicted_labels, predicted_labels].flatten() # n_inst return predicted_labels.astype(int), predicted_probas, reliabilities - + def _predict(self, X, training=False): predicted_labels, predicted_probas, reliabilities = super()._predict(X, training) confidences = 1 - np.cumprod(1 - reliabilities, axis=0) non_confident = confidences < self.confidence_thresholds[:len(predicted_labels), None] return predicted_labels, predicted_probas, non_confident, confidences - + def predict_proba(self, X): _, predicted_probas, non_confident, confidences = self._predict(X) predicted_probas[non_confident] = -1 return super().predict_proba(predicted_probas, confidences) - + def _fit_one_interval(self, X, y, i): X_part = X[..., :self.prediction_idx[i] + 1] X_part = self.scalers[i].fit_transform(X_part) @@ -40,20 +40,20 @@ def _fit_one_interval(self, X, y, i): return labels def _score(self, y, y_pred, alpha): - matches = (y_pred == np.tile(y, (self.n_pred, 1))) # n_pred x n_inst + matches = (y_pred == np.tile(y, (self.n_pred, 1))) # n_pred x n_inst n, n_inst, *_ = matches.shape confidences = np.ones((n, n_inst), dtype='float32') for i in range(self.n_pred): confidences[i] = self._reliabilities[i, y, y_pred[i]] - confidences = 1 - np.cumprod(1 - confidences, axis=0) # n_pred x n_inst - candidates = self._select_thrs(confidences) # n_candidates + confidences = 1 - np.cumprod(1 - confidences, axis=0) # n_pred x n_inst + candidates = self._select_thrs(confidences) # n_candidates cfs = np.zeros((len(candidates), n)) for i, candidate in enumerate(candidates): mask = confidences >= candidate # n_pred x n_inst - accuracy_for_candidate = (matches * mask).sum(1) / mask.sum(1) # n_pred + 
accuracy_for_candidate = (matches * mask).sum(1) / mask.sum(1) # n_pred cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) self._chosen_estimator_idx = np.argmin(cfs.mean(0)) - return candidates[np.argmin(cfs, axis=0)] # n_pred + return candidates[np.argmin(cfs, axis=0)] # n_pred @staticmethod def _select_thrs(confidences): @@ -62,13 +62,13 @@ def _select_thrs(confidences): pair_means = C[:-1] + difference / 2 difference_shifted = np.roll(difference, 1) difference_idx = np.argwhere(difference <= difference_shifted) - means_candidates = pair_means[difference_idx].flatten() + means_candidates = pair_means[difference_idx].flatten() return means_candidates if len(means_candidates) else C - + @staticmethod def cost_func(earliness, accuracies, alpha): return alpha * (1 - accuracies) + (1 - alpha) * earliness - + def fit(self, X, y): y = np.array(y).flatten().astype(int) self._init_model(X, y) @@ -89,4 +89,3 @@ def _transform_score(self, confidences): confidences[positive] *= 1 / (1 - thr) confidences[~positive] *= 1 / thr return confidences - \ No newline at end of file diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 8847c1e8c..68649f00e 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -7,14 +7,15 @@ from sklearn.metrics import confusion_matrix from sklearn.model_selection import cross_val_predict + class EconomyK(BaseETC): - def __init__(self, params: Optional[OperationParameters] = None): + def __init__(self, params: Optional[OperationParameters] = None): if params is None: - params = {} + params = {} super().__init__(params) self.prediction_mode = params.get('prediction_mode', 'last_available') self.lambda_ = params.get('lambda', 1.) 
- self._cluster_factor = params.get('cluster_factor' , 1) + self._cluster_factor = params.get('cluster_factor', 1) self._random_state = 2104 self.__cv = 5 @@ -22,21 +23,23 @@ def _init_model(self, X, y): super()._init_model(X, y) self.n_clusters = int(self._cluster_factor * self.n_classes) self._clusterizer = KMeans(self.n_clusters, random_state=self._random_state) - self.state = np.zeros((self.n_pred, self.n_clusters, self.n_classes, self.n_classes)) + self.state = np.zeros((self.n_pred, self.n_clusters, self.n_classes, self.n_classes)) def fit(self, X, y): y = y.flatten().astype(int) self._init_model(X, y) - self._pyck_ = confusion_matrix(y, self._clusterizer.fit(X).labels_, normalize='true')[:self.n_classes, :self.n_clusters] + self._pyck_ = confusion_matrix( + y, self._clusterizer.fit(X).labels_, normalize='true')[ + :self.n_classes, :self.n_clusters] for i in range(self.n_pred): self._fit_one_interval(X, y, i) - + def _fit_one_interval(self, X, y, i): X_part = X[..., :self.prediction_idx[i] + 1] X_part = self.scalers[i].fit_transform(X_part) y_pred = cross_val_predict(self.slave_estimators[i], X_part, y, cv=self.__cv) self.slave_estimators[i].fit(X_part, y) - states_by_i = np.zeros(( self.n_clusters, self.n_classes, self.n_classes)) + states_by_i = np.zeros((self.n_clusters, self.n_classes, self.n_classes)) np.add.at(states_by_i, (self._clusterizer.labels_, y, y_pred), 1) states_by_i /= np.mean(states_by_i, -2, keepdims=True) states_by_i[np.isnan(states_by_i)] = 0 @@ -44,45 +47,46 @@ def _fit_one_interval(self, X, y, i): self.state[i] = states_by_i def _predict_one_slave(self, X, i, offset=0): - cluster_centers = self._clusterizer.cluster_centers_[:, :self.prediction_idx[i] + 1] # n_clust x len + cluster_centers = self._clusterizer.cluster_centers_[:, :self.prediction_idx[i] + 1] # n_clust x len X_part = X[..., max(0, offset - 1):self.prediction_idx[i] + 1] # n_inst x len X_part = self.scalers[i].transform(X_part) probas = 
self.slave_estimators[i].predict_proba(X_part) - optimal_time, is_optimal = self._get_prediction_time(X_part, cluster_centers, i) + optimal_time, is_optimal = self._get_prediction_time(X_part, cluster_centers, i) return probas, optimal_time, is_optimal - + def __cluster_probas(self, X, centroids): length = centroids.shape[-1] diffs = np.subtract.outer(X, centroids).swapaxes(1, 2) - diffs = diffs[..., np.eye(length).astype(bool)] # n_inst x n_clust x len - distances = np.linalg.norm(diffs, axis=-1) + diffs = diffs[..., np.eye(length).astype(bool)] # n_inst x n_clust x len + distances = np.linalg.norm(diffs, axis=-1) delta_k = 1. - distances / distances.mean(axis=-1)[:, None] - s = 1. / (1. + np.exp(-self.lambda_ * delta_k)) - return s / s.sum(axis=-1)[:, None] # n_inst x n_clust + s = 1. / (1. + np.exp(-self.lambda_ * delta_k)) + return s / s.sum(axis=-1)[:, None] # n_inst x n_clust def __expected_costs(self, X, cluster_centroids, i): - cluster_probas = self.__cluster_probas(X, cluster_centroids) # n_inst x n_clust + cluster_probas = self.__cluster_probas(X, cluster_centroids) # n_inst x n_clust s_glob = np.sum(np.transpose( - np.sum(self.state[i:], axis=-1), axes=(0, 2, 1) - ) * self._pyck_[None, ...], axis=1) - costs = cluster_probas @ s_glob.T # n_inst x time_left - costs -= self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? + np.sum(self.state[i:], axis=-1), axes=(0, 2, 1) + ) * self._pyck_[None, ...], axis=1) + costs = cluster_probas @ s_glob.T # n_inst x time_left + costs -= self.earliness[None, i:] * (1 - self.accuracy_importance) # subtract or add ? 
return costs def _get_prediction_time(self, X, cluster_centroids, i): - costs = self.__expected_costs(X, cluster_centroids, i) + costs = self.__expected_costs(X, cluster_centroids, i) min_costs = np.argmin(costs, axis=-1) is_optimal = min_costs == 0 time_optimal = self.prediction_idx[min_costs + i] - return time_optimal, is_optimal # n_inst - + return time_optimal, is_optimal # n_inst + def predict_proba(self, X): probas, times, _ = self._predict(X, training=False) return super().predict_proba(probas, times) def _transform_score(self, time): idx = self._estimator_for_predict[-1] - scores = (1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) # [1 / n; 1 ] - 1 / n) * n /(n - 1) * 2 - 1 + # [1 / n; 1 ] - 1 / n) * n /(n - 1) * 2 - 1 + scores = (1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) n = self.n_pred scores -= 1 / n scores *= n / (n - 1) * 2 diff --git a/fedot_ind/core/models/early_tc/metrics.py b/fedot_ind/core/models/early_tc/metrics.py index f4a5f6544..f95586147 100644 --- a/fedot_ind/core/models/early_tc/metrics.py +++ b/fedot_ind/core/models/early_tc/metrics.py @@ -1,17 +1,18 @@ from sklearn.metrics import confusion_matrix import numpy as np -import pandas as pd -from fedot.core.data.data import InputData, OutputData -from typing import Tuple, List, Optional, Union, Literal +import pandas as pd +from typing import Union, Literal + def conf_matrix(actual, predicted): cm = confusion_matrix(actual, predicted) return dict(TN=cm[0, 0], FP=cm[0, 1], FN=cm[1, 0], TP=[1, 1]) + def average_delay(boundaries, prediction, - point, - use_idx=True, - window_placement='lefter'): + point, + use_idx=True, + window_placement='lefter'): cp_confusion = extract_cp_cm(boundaries, prediction, use_idx=use_idx, use_switch_point=False) # statistics statistics = { @@ -29,14 +30,16 @@ def average_delay(boundaries, prediction, i: time_func(triplet) for i, triplet in cp_confusion['TPs'].items() } return detection_history, statistics - + + def 
tp_transform(tps): return np.diff(tps[[1, 0]], axis=0) / np.diff(tps[[-1, 0]], axis=0) + def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], - prediction: pd.DataFrame, - use_switch_point: bool = True, # if first anomaly dot is considered as changepoint - use_idx: bool = False): + prediction: pd.DataFrame, + use_switch_point: bool = True, # if first anomaly dot is considered as changepoint + use_idx: bool = False): if isinstance(boundaries, pd.DataFrame): boundaries = boundaries.values.T anomaly_tsp = prediction[prediction == 1].sort_index().index @@ -44,18 +47,18 @@ def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], if boundaries.shape[1]: - FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest + FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest for i, (b_low, b_up) in enumerate(boundaries): all_tsp_in_window = prediction[b_low: b_up].index anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp - if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? + if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? 
FNs.append(i if use_idx else all_tsp_in_window) - TPs[i] = [b_low, - anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, + TPs[i] = [b_low, + anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, b_up] if not use_idx: FNs.append(all_tsp_in_window - anomaly_tsp_in_window) - FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest + FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest else: FPs.append(anomaly_tsp) @@ -69,9 +72,11 @@ def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], ) # cognate of single_detecting_boundaries -def get_boundaries(idx, actual_timestamps, window_size:int = None, - window_placement: Literal['left', 'right', 'central'] = 'left', - intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', + + +def get_boundaries(idx, actual_timestamps, window_size: int = None, + window_placement: Literal['left', 'right', 'central'] = 'left', + intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', ): # idx = idx # cast everything to pandas object fir the subsequent comfort @@ -82,30 +87,30 @@ def get_boundaries(idx, actual_timestamps, window_size:int = None, else: idx = pd.Series(idx) td = window_size - else: + else: raise TypeError('Unexpected type of ts index') - + boundaries = np.tile(actual_timestamps, (2, 1)) - # [0, ...] - lower bound, [1, ...] - upper + # [0, ...] - lower bound, [1, ...] 
- upper if window_placement == 'left': boundaries[0] -= td elif window_placement == 'central': boundaries[0] -= td / 2 boundaries[1] += td / 2 elif window_placement == 'right': - boundaries[1] += td + boundaries[1] += td else: raise ValueError('Unknown mode') - + if not len(actual_timestamps): return boundaries - # intersection resolution + # intersection resolution for i in range(len(actual_timestamps) - 1): if not boundaries[0, i + 1] > boundaries[1, i]: continue - if intersection_mode == 'shift_to_left': + if intersection_mode == 'shift_to_left': boundaries[0, i + 1] = boundaries[1, i] elif intersection_mode == 'shift_to_right': boundaries[1, i] = boundaries[0, i + 1] @@ -120,6 +125,7 @@ def get_boundaries(idx, actual_timestamps, window_size:int = None, boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) return boundaries + def nab(boundaries, predictions, mode='standard', custom_coefs=None): inner_coefs = { 'low_FP': [1.0, -0.11, -1.0], @@ -128,11 +134,9 @@ def nab(boundaries, predictions, mode='standard', custom_coefs=None): } coefs = custom_coefs or inner_coefs[mode] confusion_matrix = extract_cp_cm(boundaries, predictions) - + tps = confusion_matrix['tps'] - score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], + score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], coefs) return score - - diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index b72a927f1..03551dbc7 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -4,10 +4,11 @@ from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.models.early_tc.base_early_tc import BaseETC + class ProbabilityThresholdClassifier(BaseETC): def __init__(self, params: Optional[OperationParameters] = None): if params is None: - params = {} + params = {} 
super().__init__(params) self.probability_threshold = params.get('probability_threshold', None) @@ -15,7 +16,7 @@ def _init_model(self, X, y): super()._init_model(X, y) if self.probability_threshold is None: self.probability_threshold = 1 / len(self.classes_[0]) - + def predict_proba(self, X): _, predicted_probas, non_acceptance = self._predict(X, training=False) predicted_probas[non_acceptance] = 0 @@ -33,11 +34,11 @@ def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) self._chosen_estimator_idx = np.argmax(scores) return scores - + def fit(self, X, y): super().fit(X, y) self._score(X, y, self.accuracy_importance) - + def _transform_score(self, confidences): thr = self.probability_threshold confidences = confidences - thr diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 0350d0886..6d7c4470f 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -8,7 +8,7 @@ class TEASER(BaseETC): - def __init__(self, params: Optional[OperationParameters] = None): + def __init__(self, params: Optional[OperationParameters] = None): super().__init__(params) self._oc_svm_params = (100., 10., 5., 2.5, 1.5, 1., 0.5, 0.25, 0.1) @@ -18,29 +18,29 @@ def _init_model(self, X, y): def _fit_one_interval(self, X, y, i): probas = super()._fit_one_interval(X, y, i) - filtered_probas = self._filter_trues(probas, y) # + filtered_probas = self._filter_trues(probas, y) X_oc = self._form_X_oc(filtered_probas) self.oc_estimators[i] = GridSearchCV(OneClassSVM(), - param_grid={"gamma": self._oc_svm_params}, - scoring='accuracy', - cv=min(X.shape[0], 10) - ).fit(X_oc, np.ones((len(X_oc), 1))).best_estimator_ + param_grid={"gamma": self._oc_svm_params}, + scoring='accuracy', + cv=min(X.shape[0], 10) + ).fit(X_oc, np.ones((len(X_oc), 1))).best_estimator_ def _predict_one_slave(self, X, i, offset=0): probas, labels = super()._predict_one_slave(X, i, offset) 
X_oc = self._form_X_oc(probas) return X_oc, probas, labels - - def _filter_trues(self, predicted_probas, y): # different logic in sktime + + def _filter_trues(self, predicted_probas, y): # different logic in sktime predicted_labels = np.argmax(predicted_probas, axis=-1).flatten() return predicted_probas[predicted_labels == y] - + def _form_X_oc(self, predicted_probas): d = (predicted_probas.max() - predicted_probas) d[d == 0] = 1 d = d.min(axis=-1).reshape(-1, 1) return np.hstack([predicted_probas, d]) - + def _predict(self, X, training=False): estimator_indices, offset = self._select_estimators(X) X_ocs, predicted_probas, predicted_labels = map(np.stack, zip( @@ -48,30 +48,30 @@ def _predict(self, X, training=False): )) non_acceptance = self._consecutive_count(predicted_labels) < self.consecutive_predictions final_verdicts = np.zeros((len(estimator_indices), X.shape[0])) - # for each point of estimation + # for each point of estimation for i in range(predicted_labels.shape[0]): # find not accepted points X_to_ith = X_ocs[i] # if they are not outliers final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # mark as accepted - final_verdicts[i] = final_verdict + final_verdicts[i] = final_verdict non_acceptance[non_acceptance & (final_verdict > 0)] = False return predicted_labels, predicted_probas, non_acceptance, final_verdicts - + def predict_proba(self, X): _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] return super().predict_proba(predicted_probas, final_verdicts) - + def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) self._chosen_estimator_idx = np.argmax(scores) return scores - + def fit(self, X, y): super().fit(X, y) return self._score(X, y, self.accuracy_importance) - + def _transform_score(self, scores): return np.tanh(scores) diff --git 
a/fedot_ind/core/models/nn/network_impl/base_nn_model.py b/fedot_ind/core/models/nn/network_impl/base_nn_model.py index f285853d0..d76737d6a 100644 --- a/fedot_ind/core/models/nn/network_impl/base_nn_model.py +++ b/fedot_ind/core/models/nn/network_impl/base_nn_model.py @@ -123,9 +123,9 @@ def _train_one_batch(self, batch, optimizer, loss_fn): training_loss = loss.data.item() * inputs.size(0) total = targets.size(0) correct = (torch.argmax(output, 1) == - torch.argmax(targets, 1)).sum().item() + torch.argmax(targets, 1)).sum().item() return training_loss, total, correct - + def _eval_one_batch(self, batch, loss_fn): inputs, targets = batch output = self.model(inputs) @@ -133,11 +133,11 @@ def _eval_one_batch(self, batch, loss_fn): valid_loss = loss.data.item() * inputs.size(0) total = targets.size(0) correct = (torch.argmax(output, 1) == - torch.argmax(targets, 1)).sum().item() + torch.argmax(targets, 1)).sum().item() return valid_loss, total, correct def _run_one_epoch(self, train_loader, val_loader, - optimizer, loss_fn, + optimizer, loss_fn, epoch, val_interval, early_stopping, scheduler, best_val_loss): @@ -172,7 +172,7 @@ def _run_one_epoch(self, train_loader, val_loader, early_stopping(training_loss, self.model, './') adjust_learning_rate(optimizer, scheduler, - epoch + 1, self.learning_rate, printout=False) + epoch + 1, self.learning_rate, printout=False) scheduler.step() return best_model, best_val_loss @@ -188,7 +188,7 @@ def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): best_val_loss = float('inf') val_interval = self.get_validation_frequency( self.epochs, self.learning_rate) - loss_prefix = 'RMSE' if self.is_regression_task else 'Accuracy' + 'RMSE' if self.is_regression_task else 'Accuracy' for epoch in range(1, self.epochs + 1): best_model, best_val_loss = self._run_one_epoch( train_loader, val_loader, diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 604f28660..627eaf8a1 
100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -1,69 +1,65 @@ -import copy from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel -from typing import Optional, Callable, Any, List, Union +from typing import Optional from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.data.data import InputData, OutputData -from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE +from fedot.core.data.data import InputData +from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY import torch.optim as optim -import torch.optim.lr_scheduler as lr_scheduler import torch.nn as nn import torch.nn.functional as F import torch -from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array -import pandas as pd -from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping -import torch.utils.data as data + class SqueezeExciteBlock(nn.Module): - def __init__(self, input_channels, filters, reduce=4): - super().__init__() - self.filters = filters - self.pool = nn.AvgPool1d(input_channels) - self.bottleneck = max(self.filters // reduce, 4) - self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) - self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) - torch.nn.init.kaiming_normal_(self.fc1.weight.data) - torch.nn.init.kaiming_normal_(self.fc2.weight.data) - - def forward(self, x): - input_x = x - x = self.pool(x) - x = F.relu(self.fc1(x.view(-1, 1, self.filters))) - x = F.sigmoid(self.fc2(x)) - x = x.view(-1, self.filters, 1) * input_x - return x + def __init__(self, input_channels, filters, reduce=4): + super().__init__() + self.filters = filters + self.pool = nn.AvgPool1d(input_channels) + 
self.bottleneck = max(self.filters // reduce, 4) + self.fc1 = nn.Linear(self.filters, self.bottleneck, bias=False) + self.fc2 = nn.Linear(self.bottleneck, self.filters, bias=False) + torch.nn.init.kaiming_normal_(self.fc1.weight.data) + torch.nn.init.kaiming_normal_(self.fc2.weight.data) + + def forward(self, x): + input_x = x + x = self.pool(x) + x = F.relu(self.fc1(x.view(-1, 1, self.filters))) + x = F.sigmoid(self.fc2(x)) + x = x.view(-1, self.filters, 1) * input_x + return x + class MLSTM_module(nn.Module): def __init__(self, input_size, input_channels, - inner_size, inner_channels, + inner_size, inner_channels, output_size, num_layers, dropout=0.25): super().__init__() self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) self.lstm = nn.LSTM(input_size, inner_size, num_layers, - batch_first=True, dropout=dropout) - - squeeze_excite_size = input_size #if not interval else interval + batch_first=True, dropout=dropout) + + squeeze_excite_size = input_size # if not interval else interval self.conv_branch = nn.Sequential( nn.Conv1d(input_channels, inner_channels, padding='same', - kernel_size=9), + kernel_size=9), nn.BatchNorm1d(inner_channels), nn.ReLU(), SqueezeExciteBlock(squeeze_excite_size, inner_channels), nn.Conv1d(inner_channels, inner_channels * 2, padding='same', kernel_size=5, - ), # c x l | n x c x l - nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels * 2), # n x c | n x c x l nn.ReLU(), SqueezeExciteBlock(squeeze_excite_size, inner_channels * 2), nn.Conv1d(inner_channels * 2, inner_channels, padding='same', kernel_size=3, - ), # c x l | n x c x l - nn.BatchNorm1d(inner_channels), # n x c | n x c x l + ), # c x l | n x c x l + nn.BatchNorm1d(inner_channels), # n x c | n x c x l nn.ReLU(), ) seq = next(iter(self.conv_branch.modules())) @@ -72,8 +68,8 @@ def __init__(self, input_size, input_channels, torch.nn.init.kaiming_uniform_(seq[i].weight.data) def 
forward(self, x, hidden_state=None, return_hidden=False): - x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size - x_conv = self.conv_branch(x) # n x inner_ch x len + x_lstm, hidden_state = self.lstm(x, hidden_state) # n x input_ch x inner_size + x_conv = self.conv_branch(x) # n x inner_ch x len x = torch.cat([torch.flatten(x_lstm, start_dim=1), torch.flatten(x_conv, start_dim=1)], dim=-1) x = F.softmax(self.proj(x)) if return_hidden: @@ -84,7 +80,7 @@ def forward(self, x, hidden_state=None, return_hidden=False): class MLSTM(BaseNeuralModel): def __init__(self, params: Optional[OperationParameters] = None): if params is None: - params = {} + params = {} super().__init__() self.dropout = params.get('dropout', 0.25) self.hidden_size = params.get('hidden_size', 64) @@ -94,34 +90,34 @@ def __init__(self, params: Optional[OperationParameters] = None): self.min_ts_length = params.get('min_ts_length', 5) self.fitting_mode = params.get('fitting_mode', 'zero_padding') self.proba_thr = params.get('proba_thr', None) - + def __repr__(self): return 'MLSTM' - + def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) prediction_idx = np.arange(interval_length - 1, n_idx, interval_length) - self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 return prediction_idx, interval_length def _init_model(self, ts: InputData): _, input_channels, input_size = ts.features.shape self.input_size = input_size self.prediction_idx, self.interval = self._compute_prediction_points(input_size) - self.model = MLSTM_module(input_size if self.fitting_mode != 'moving_window' else self.interval, - input_channels, - self.hidden_size, self.hidden_channels, - self.num_classes, self.num_layers, - self.dropout) - self.model_for_inference = MLSTM_module(input_size if 
self.fitting_mode != 'moving_window' else self.interval, + self.model = MLSTM_module(input_size if self.fitting_mode != 'moving_window' else self.interval, input_channels, self.hidden_size, self.hidden_channels, self.num_classes, self.num_layers, self.dropout) + self.model_for_inference = MLSTM_module(input_size if self.fitting_mode != 'moving_window' else self.interval, + input_channels, + self.hidden_size, self.hidden_channels, + self.num_classes, self.num_layers, + self.dropout) optimizer = optim.Adam(self.model.parameters(), lr=0.001) loss_fn = CROSS_ENTROPY() return loss_fn, optimizer - + @convert_to_3d_torch_array def _fit_model(self, ts: InputData): mode = self.fitting_mode @@ -144,17 +140,17 @@ def _fit_model(self, ts: InputData): ) else: raise ValueError('Unknown fitting mode') - + def _moving_window_output(self, inputs): hidden_state = None output = -torch.ones((inputs.shape[0], self.num_classes)) for i in self.prediction_idx: if i >= inputs.shape[-1]: break - batch_interval = inputs[..., i - self.prediction_idx[0] : i + 1] + batch_interval = inputs[..., i - self.prediction_idx[0]: i + 1] output, hidden_state = self.model(batch_interval, hidden_state, return_hidden=True) return output - + def _train_one_batch(self, batch, optimizer, loss_fn): if self.fitting_mode == 'zero_padding': return super()._train_one_batch(batch, optimizer, loss_fn) @@ -168,11 +164,11 @@ def _train_one_batch(self, batch, optimizer, loss_fn): training_loss = loss.data.item() * inputs.size(0) total = targets.size(0) correct = (torch.argmax(output, 1) == - torch.argmax(targets, 1)).sum().item() + torch.argmax(targets, 1)).sum().item() return training_loss, total, correct else: raise ValueError('Unknown fitting mode!') - + def _eval_one_batch(self, batch, loss_fn): if self.fitting_mode == 'zero_padding': return super()._eval_one_batch(batch, loss_fn) @@ -183,7 +179,7 @@ def _eval_one_batch(self, batch, loss_fn): valid_loss = loss.data.item() * inputs.size(0) total = targets.size(0) 
correct = (torch.argmax(output, 1) == - torch.argmax(targets, 1)).sum().item() + torch.argmax(targets, 1)).sum().item() return valid_loss, total, correct else: raise ValueError('Unknown fitting mode!') @@ -199,7 +195,7 @@ def _predict_model(self, x_test: InputData, output_mode: str = 'default'): else: raise ValueError('Unknown prediction mode') return self._convert_predict(pred, output_mode) - + def _padding(self, ts: np.array): if ts.shape[-1] == self.input_size: return torch.tensor(ts).float() @@ -221,7 +217,7 @@ def _augment_with_zeros(self, batch: np.array): y_res = np.concatenate(y_res) perm = np.random.permutation(X_res.shape[0]) return torch.tensor(X_res[perm]), torch.tensor(y_res[perm]) - + def _transform_score(self, probas): # linear interp thr = self.proba_thr diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 832eaad26..7be4c626d 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -67,29 +67,29 @@ }, 'ecec': { 'interval_percentage': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[5, 10, 20, 25]]}, + 'sampling-scope': [[5, 10, 20, 25]]}, 'accuracy_importance': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[i / 10 for i in range(11)]]}, + 'sampling-scope': [[i / 10 for i in range(11)]]}, }, 'economy_k': { 'interval_percentage': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[5, 10, 20, 25]]}, + 'sampling-scope': [[5, 10, 20, 25]]}, 'lambda': {'hyperopt-dist': hp.choice, 'sampling-scope': [[1e-6, 1e-3, 1e-2, 1e-1, 1, 1e1, 1e2, 1e3, 1e4, 1e6]]}, 'accuracy_importance': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[i / 10 for i in range(11)]]}, + 'sampling-scope': [[i / 10 for i in range(11)]]}, }, 'mlstm_model': { 'interval_percentage': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[5, 10, 20, 25]]}, + 'sampling-scope': [[5, 10, 20, 25]]}, 'dropout': {'hyperopt-dist': hp.choice, 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5]]}, 'hidden_size': 
{'hyperopt-dist': hp.choice, - 'sampling-scope': [list(range(10, 101, 10))]}, + 'sampling-scope': [list(range(10, 101, 10))]}, 'num_layers': {'hyperopt-dist': hp.choice, - 'sampling-scope': [list(range(1, 6))]}, + 'sampling-scope': [list(range(1, 6))]}, 'hidden_channels': {'hyperopt-dist': hp.choice, - 'sampling-scope': [8, 16, 32, 64, 96]}, + 'sampling-scope': [8, 16, 32, 64, 96]}, }, 'proba_threshold_etc': {'interval_percentage': {'hyperopt-dist': hp.choice, @@ -97,32 +97,32 @@ 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, 'accuracy_importance': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, - }, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, + }, 'teaser': {'interval_percentage': {'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, 'sampling_scope': [[1, 2, 3, 4, 5]]}, 'accuracy_importance': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, - }, - 'deepar_model': - {'epochs': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, + }, + 'deepar_model': + {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(10, 100, 10)]]}, 'batch_size': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(8, 64, 6)]]}, - 'dropout': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5]]}, - 'rnn_layers':{'hyperopt-dist': hp.choice, - 'sampling-scope': [list(range(1, 6))]}, - 'hidden_size':{'hyperopt-dist': hp.choice, - 'sampling-scope': [list(range(10, 101, 10))]}, - 'cell_type':{'hyperopt-dist': hp.choice, - 'sampling-scope': [['GRU', 'LSTM', 'RNN']]}, - 'expected_distribution': {'hyperopt-dist': hp.choice, - 'sampling-scope': [['normal', 'cauchy']]} - }, + 'dropout': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[0.1, 0.2, 
0.3, 0.4, 0.5]]}, + 'rnn_layers': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(1, 6))]}, + 'hidden_size': {'hyperopt-dist': hp.choice, + 'sampling-scope': [list(range(10, 101, 10))]}, + 'cell_type': {'hyperopt-dist': hp.choice, + 'sampling-scope': [['GRU', 'LSTM', 'RNN']]}, + 'expected_distribution': {'hyperopt-dist': hp.choice, + 'sampling-scope': [['normal', 'cauchy']]} + }, 'patch_tst_model': {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(10, 100, 10)]]}, 'batch_size': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(8, 64, 6)]]}, diff --git a/tests/unit/core/models/test_teaser.py b/tests/unit/core/models/test_teaser.py index 2bc19b8de..1cf847f67 100644 --- a/tests/unit/core/models/test_teaser.py +++ b/tests/unit/core/models/test_teaser.py @@ -8,10 +8,12 @@ def teaser(): teaser = TEASER.TEASER({'interval_length': 10, 'prediction_mode': ''}) return teaser + @pytest.fixture(scope='module') def xy(): return np.random.randn((2, 23)), np.random.randint(0, 2, size=(2, 1)) + def test_get_applicable_index(teaser): teaser._init_model(23) idx, offset = teaser._get_last_applicable_idx(100) @@ -21,6 +23,7 @@ def test_get_applicable_index(teaser): assert offset == 100 - teaser.prediction_idx[idx], 'Wrong offset estimation in the middle' assert idx == len(teaser.prediction_idx) - 1 + def test_compute_prediction_points(teaser): indices = teaser._compute_prediction_points(23) assert 2 in indices @@ -31,5 +34,3 @@ def test_compute_prediction_points(teaser): # pass # def test_score(teaser): - - From c2126eda06f46441cf3314055d40d8ce91c0ee73 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 28 Jun 2024 14:11:17 +0300 Subject: [PATCH 33/43] both etc models are registered, available via api --- .../repository/data/industrial_model_repository.json | 10 ++++++++++ fedot_ind/core/repository/model_repository.py | 1 + fedot_ind/core/tuning/search_space.py | 8 ++++++++ 3 files changed, 19 insertions(+) diff --git 
a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 9b624321f..145aa979c 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -773,6 +773,16 @@ ], "input_type": "[DataTypesEnum.table]" }, + "proba_threshold_etc": { + "meta": "sklearn_class", + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" + }, "xgboost": { "meta": "sklearn_class", "presets": ["*tree"], diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index c3e226dc7..e79eea250 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -49,6 +49,7 @@ from fedot_ind.core.models.early_tc.economy_k import EconomyK from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier from fedot_ind.core.models.early_tc.teaser import TEASER +from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier from fedot_ind.core.models.manifold.riemann_embeding import RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 832eaad26..2f1889a96 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -107,6 +107,14 @@ 'accuracy_importance': {'hyperopt-dist': hp.choice, 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, }, + 'proba_threshold_etc': + {'interval_percentage': {'hyperopt-dist': hp.choice, + 'sampling-scope': [[5, 10, 20, 25]]}, + 'acceptance_threshold': {'hyperopt-dist': hp.choice, + 'sampling_scope': [[1, 2, 3, 4, 5]]}, + 
'hm_shift_to_acc': {'hyperopt-dist': hp.choice, + 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, + }, 'deepar_model': {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': [[x for x in range(10, 100, 10)]]}, From 143b7a2580b8b5459eb15eaf7a69173109166e57 Mon Sep 17 00:00:00 2001 From: leostre Date: Tue, 9 Jul 2024 14:33:24 +0300 Subject: [PATCH 34/43] fitting w augmentation --- fedot_ind/core/models/nn/network_impl/mlstm.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 604f28660..9a22d7108 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -11,7 +11,7 @@ import torch from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array, fedot_data_type import pandas as pd from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping import torch.utils.data as data From ded4f22944f1a9c7b4e4635e3bb2fb2a6b28a6c5 Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 01:27:24 +0300 Subject: [PATCH 35/43] all work, but need eval --- fedot_ind/core/models/early_tc/base_early_tc.py | 3 +++ fedot_ind/core/models/early_tc/economy_k.py | 1 + 2 files changed, 4 insertions(+) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 9c8e12cb8..d488e22b0 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -77,6 +77,9 @@ def _select_estimators(self, X, training=False): elif training or self.prediction_mode == 'all': last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) estimator_indices = 
np.arange(last_idx + 1) + elif 'last_available': + last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) + estimator_indices = [last_idx] else: raise ValueError('Unknown prediction mode') return estimator_indices, offset diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 481cad97b..9958d408d 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -15,6 +15,7 @@ def __init__(self, params: Optional[OperationParameters] = None): self.prediction_mode = params.get('prediction_mode', 'last_available') self.lambda_ = params.get('lambda', 1.) self._cluster_factor = params.get('cluster_factor' , 1) + # self.confidence_mode = params.get('confidence_mode', 'time') # or 'confidence' self._random_state = 2104 self.__cv = 5 From 40afba90572107649b8316128b64fc5e433c173d Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 12:09:39 +0300 Subject: [PATCH 36/43] evth converged to one interface + refactored --- fedot_ind/core/models/early_tc/base_early_tc.py | 3 --- fedot_ind/core/models/early_tc/ecec.py | 2 ++ fedot_ind/core/models/early_tc/economy_k.py | 1 - fedot_ind/core/models/nn/network_impl/mlstm.py | 2 +- .../repository/data/industrial_model_repository.json | 11 ++++++++++- fedot_ind/core/repository/model_repository.py | 1 - fedot_ind/core/tuning/search_space.py | 2 +- 7 files changed, 14 insertions(+), 8 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index d488e22b0..9c8e12cb8 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -77,9 +77,6 @@ def _select_estimators(self, X, training=False): elif training or self.prediction_mode == 'all': last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) estimator_indices = np.arange(last_idx + 1) - elif 'last_available': - last_idx, offset = 
self._get_applicable_index(X.shape[-1] - 1) - estimator_indices = [last_idx] else: raise ValueError('Unknown prediction mode') return estimator_indices, offset diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index 576b3a4ba..b83cc3254 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -25,6 +25,8 @@ def _predict(self, X, training=False): predicted_labels, predicted_probas, reliabilities = super()._predict(X, training) confidences = 1 - np.cumprod(1 - reliabilities, axis=0) non_confident = confidences < self.confidence_thresholds[:len(predicted_labels), None] + predicted_labels = np.stack(predicted_labels) + predicted_probas = np.stack(predicted_probas) return predicted_labels, predicted_probas, non_confident, confidences def predict_proba(self, X): diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 9958d408d..481cad97b 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -15,7 +15,6 @@ def __init__(self, params: Optional[OperationParameters] = None): self.prediction_mode = params.get('prediction_mode', 'last_available') self.lambda_ = params.get('lambda', 1.) 
self._cluster_factor = params.get('cluster_factor' , 1) - # self.confidence_mode = params.get('confidence_mode', 'time') # or 'confidence' self._random_state = 2104 self.__cv = 5 diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 9a22d7108..604f28660 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -11,7 +11,7 @@ import torch from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array, fedot_data_type +from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array import pandas as pd from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping import torch.utils.data as data diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index 145aa979c..b05cb3c95 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -766,7 +766,6 @@ "teaser": { "meta": "sklearn_class", "tags": [ - "simple", "interpretable", "non_lagged", "non_linear" @@ -783,6 +782,16 @@ ], "input_type": "[DataTypesEnum.table]" }, + "teaser": { + "meta": "sklearn_class", + "tags": [ + "simple", + "interpretable", + "non_lagged", + "non_linear" + ], + "input_type": "[DataTypesEnum.table]" + }, "xgboost": { "meta": "sklearn_class", "presets": ["*tree"], diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index e79eea250..c3e226dc7 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -49,7 +49,6 @@ from fedot_ind.core.models.early_tc.economy_k import EconomyK from 
fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier from fedot_ind.core.models.early_tc.teaser import TEASER -from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier from fedot_ind.core.models.manifold.riemann_embeding import RiemannExtractor from fedot_ind.core.models.nn.network_impl.dummy_nn import DummyOverComplicatedNeuralNetwork from fedot_ind.core.models.nn.network_impl.deepar import DeepAR diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 2f1889a96..05b844998 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -107,7 +107,7 @@ 'accuracy_importance': {'hyperopt-dist': hp.choice, 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, }, - 'proba_threshold_etc': + 'teaser': {'interval_percentage': {'hyperopt-dist': hp.choice, 'sampling-scope': [[5, 10, 20, 25]]}, 'acceptance_threshold': {'hyperopt-dist': hp.choice, From d6ad8fda9a704823a1fda17267b7681a86b5d1cb Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 12 Jul 2024 15:02:54 +0300 Subject: [PATCH 37/43] slight fixes --- fedot_ind/core/tuning/search_space.py | 8 -------- 1 file changed, 8 deletions(-) diff --git a/fedot_ind/core/tuning/search_space.py b/fedot_ind/core/tuning/search_space.py index 05b844998..832eaad26 100644 --- a/fedot_ind/core/tuning/search_space.py +++ b/fedot_ind/core/tuning/search_space.py @@ -107,14 +107,6 @@ 'accuracy_importance': {'hyperopt-dist': hp.choice, 'sampling-scope': [[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1,]]}, }, - 'teaser': - {'interval_percentage': {'hyperopt-dist': hp.choice, - 'sampling-scope': [[5, 10, 20, 25]]}, - 'acceptance_threshold': {'hyperopt-dist': hp.choice, - 'sampling_scope': [[1, 2, 3, 4, 5]]}, - 'hm_shift_to_acc': {'hyperopt-dist': hp.choice, - 'sampling-scope': [0.01, 0.1, 0.5, 1, 5, 10, 100]}, - }, 'deepar_model': {'epochs': {'hyperopt-dist': hp.choice, 'sampling-scope': 
[[x for x in range(10, 100, 10)]]}, From 8fec47f82fe63417a37e6fca04f9701210387816 Mon Sep 17 00:00:00 2001 From: leostre Date: Mon, 22 Jul 2024 17:32:52 +0300 Subject: [PATCH 38/43] added tests and notebook --- .../early_classification_example.ipynb | 588 ++++++++++++++++++ fedot_ind/core/metrics/interval_metrics.py | 3 +- .../core/metrics/metrics_implementation.py | 12 +- .../core/models/early_tc/base_early_tc.py | 50 +- fedot_ind/core/models/early_tc/ecec.py | 12 +- fedot_ind/core/models/early_tc/economy_k.py | 25 +- .../core/models/early_tc/prob_threshold.py | 21 +- fedot_ind/core/models/early_tc/teaser.py | 30 +- .../models/nn/network_impl/base_nn_model.py | 15 +- .../core/models/nn/network_impl/mlstm.py | 30 +- .../models/nn/network_impl/transformer.py | 2 + .../models/quantile/quantile_extractor.py | 2 +- .../data/industrial_model_repository.json | 4 +- .../unit/core/models/model_impl/test_mlstm.py | 37 ++ tests/unit/core/models/test_etc.py | 98 +++ 15 files changed, 866 insertions(+), 63 deletions(-) create mode 100644 examples/real_world_examples/industrial_examples/early_classification_example.ipynb create mode 100644 tests/unit/core/models/model_impl/test_mlstm.py create mode 100644 tests/unit/core/models/test_etc.py diff --git a/examples/real_world_examples/industrial_examples/early_classification_example.ipynb b/examples/real_world_examples/industrial_examples/early_classification_example.ipynb new file mode 100644 index 000000000..bd6f5fab0 --- /dev/null +++ b/examples/real_world_examples/industrial_examples/early_classification_example.ipynb @@ -0,0 +1,588 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Load data" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "For the following Early time series classification models let's load some univariate data" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "from 
fedot_ind.api.utils.path_lib import PROJECT_PATH\n", + "import sys\n", + "import os\n", + "\n", + "if not os.getcwd() == PROJECT_PATH:\n", + " os.chdir(PROJECT_PATH)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "from fedot.core.data.data import InputData\n", + "from fedot.core.repository.dataset_types import DataTypesEnum\n", + "from fedot.core.repository.tasks import Task, TaskTypesEnum\n", + "from fedot_ind.api.utils.path_lib import PROJECT_PATH\n", + "from fedot_ind.core.architecture.settings.computational import backend_methods as np\n", + "import matplotlib.pyplot as plt\n", + "import seaborn as sns\n", + "from tqdm.autonotebook import tqdm" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2024-07-22 13:42:16,908 - PyTorch version 2.2.2 available.\n" + ] + } + ], + "source": [ + "from fedot_ind.tools.loader import DataLoader\n", + "\n", + "def load_univariate_classification():\n", + " dl = DataLoader('Lightning7')\n", + " (train_series, train_labels), (test_series, test_labels) = dl.load_data()\n", + " train_data = InputData(idx=np.arange(test_series.shape[1]),\n", + " features=train_series.values,\n", + " target=train_labels,\n", + " task=Task(TaskTypesEnum.classification),\n", + " data_type=DataTypesEnum.table)\n", + " test_data = InputData(idx=np.arange(test_series.shape[1]),\n", + " features=test_series.values,\n", + " target=test_labels,\n", + " task=Task(TaskTypesEnum.classification),\n", + " data_type=DataTypesEnum.table)\n", + " return train_data, test_data\n" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Shape of train_data.features: (70, 319)\n", + "test_data shape: (73, 319)\n", + "Number of classes: 7\n" + ] + } + ], + "source": [ + "train_data, test_data = 
load_univariate_classification()\n", + "print(f'Shape of train_data.features: {train_data.features.shape}\\ntest_data shape: {test_data.features.shape}')\n", + "print('Number of classes:', len(np.unique(train_data.target)))" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "plt.bar(*(np.unique(train_data.target, return_counts=True)))\n", + "plt.ylabel('Count')\n", + "plt.xlabel('Class')\n", + "plt.yticks(np.arange(0, 21, 2));\n", + "plt.grid(axis='y');" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Standalone models" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "All the models presented below share the same principle of functioning:\n", + "\n", + "Since there's no way for many classifiers to support inference for different data sizes, the basic Early ETSC class implements fitting of multiple slave estimators according to the specified intervals (by *interval_percentage* key word) on time series instance. Depending on the length of features passed and *prediction_mode* parameter the appropriate subset if classifiers is selected and inference is committed. The details of fitting and inference vary drastically. " + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "from fedot_ind.core.models.early_tc import base_early_tc as BASE_ETC\n", + "from importlib import reload\n", + "\n", + "Xtr, ytr = train_data.features.squeeze(), train_data.target\n", + "Xte, yte = test_data.features.squeeze(), test_data.target\n", + "\n", + "INTEVAL_PERCENTAGE = 10\n", + "earliness = np.round((1 - np.arange(0, Xtr.shape[0], int(INTEVAL_PERCENTAGE * Xtr.shape[0] / 100)) / Xtr.shape[0]) * 100)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 198, + "metadata": {}, + "outputs": [], + "source": [ + "from fedot_ind.core.metrics.metrics_implementation import ETSCPareto\n", + "\n", + "def eval_param_influence(model, prm_name, options, **model_kw):\n", + " r = {}\n", + " for option in tqdm(options, desc='Options'):\n", + " model_ = model({prm_name: option, **model_kw})\n", + " model_.fit(Xtr, ytr)\n", + " labels, scores = model_.predict(Xte)\n", + " 
r[option] = ETSCPareto(yte, labels.astype(int), scores, reduce=False, metric_list=('accuracy',)).metric().copy()\n", + " return r\n", + "\n", + "def plot_changes(result_metrics: dict, param_name='', height=3):\n", + " fig, axes = plt.subplots(1, len(result_metrics), figsize=(len(result_metrics) * height, height * 1.2))\n", + " for i, (param_val, values) in enumerate(result_metrics.items()):\n", + " n = len(values.accuracy)\n", + " earliness = np.round((1 - np.arange(n)/ n) * 100)\n", + " axes[i].plot(values.robustness, \n", + " values.accuracy, c='k', alpha=0.4)\n", + " scatter = axes[i].scatter(x=values.robustness, \n", + " y=values.accuracy,\n", + " c=earliness,\n", + " cmap='plasma'\n", + " )\n", + " axes[i].set_xlim((-0.05, 1.05))\n", + " axes[i].set_ylim((-0.05, 1.05))\n", + " axes[i].set_xticks(np.linspace(0, 1, 6))\n", + " axes[i].set_yticks(np.linspace(0, 1, 6))\n", + " axes[i].grid('all')\n", + " axes[i].set_title(f'{param_name} = {param_val}')\n", + " if i == 0: \n", + " legend1 = axes[i].legend(*scatter.legend_elements(alpha=0.6),\n", + " loc='best',\n", + " title=\"earliness, %\",\n", + " ncols=2,\n", + " borderaxespad=0\n", + " )\n", + " axes[i].add_artist(legend1)\n", + " \n", + " fig.supylabel('accuracy')\n", + " fig.supxlabel('robustness')\n", + " fig.tight_layout()\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Probability Thresholding" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Probability Thresholding executes the simplest mode of prediction:\n", + "\n", + "Firstly, the number of matching consecutive predictions is evaluated. If the number of classifiers that predicted the same label exceeds the specified *consecutive_predictions* parameter, the classification is done confidently. \n", + "\n", + "Otherwise the predicted probability is compared to the *probability_threshold*, and if it is not below the threshold, the prediction is accepted."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from fedot_ind.core.models.early_tc import prob_threshold as PROB_THR\n", + "\n", + "cons_preds = [1, 3, 5, 7]\n", + "r_pthr = eval_param_influence(PROB_THR.ProbabilityThresholdClassifier,\n", + " 'consecutive_predictions', cons_preds, probability_threshold=0.8,\n", + " prediction_mode='all', interval_percentage=INTEVAL_PERCENTAGE) " + ] + }, + { + "cell_type": "code", + "execution_count": 199, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "plot_changes(r_pthr, param_name='consec_preds', height=3.5)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "As we may see on the plot above, the edge value of *consecutive_predictions* = 1 results in acceptance of all the prediction made. And main influence of this parameter is observed in the middle range of predictors. The accuracy of predictions doesn't sigificantly change, whereas the common trend is left shift resulting in lesser proportion of accepted labels." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Teaser " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Another model exploiting the consecutive labels count is TEASER. But the way to prove acceptance of prediction is a bit more elaborate: instead of simple thresholding the evaluation mechanism is OneClass SVM which is trained for every prediction point on correct predictions. The features for their fitting are class probabilities with addition of most close proba differences for every prediction. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from fedot_ind.core.models.early_tc import teaser as TEASER\n", + "\n", + "cons_preds = [1, 3, 5, 7]\n", + "r_teaser = eval_param_influence(TEASER.TEASER,\n", + " 'consecutive_predictions', cons_preds,\n", + " prediction_mode='all', interval_percentage=INTEVAL_PERCENTAGE)" + ] + }, + { + "cell_type": "code", + "execution_count": 200, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "plot_changes(r_teaser, param_name='cons_preds', height=4)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Here we see the same behavior on the first subplot. But in other cases model demonstrates the greater hesitation for the most early points. Further, the greater amount of consecutive predictions is required, the lefter point shift. So, one may conclude the OneClassSVM approach is not as stable as the thresholding is or the underfitting of classifiers is present." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### EconomyK" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "EconomyK algorithm widens the boundaries of basic classsifiers queue with the estimation of prefixes clustering results. Clustering is conducted with fast KMeans during the training phase and for prefixes the required length is cropped from centroids' coordinates. \n", + "\n", + "The accessed values of probability of being labeled as a cluster member is recalculated and used to ensure the slave prediction. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import fedot_ind.core.models.early_tc.economy_k as ECONOMYK\n", + "params = [1e-3, 1, 1e5, 1e7]\n", + "r_economy_k = eval_param_influence(ECONOMYK.EconomyK,\n", + " 'lambda_', params,\n", + " prediction_mode='all', interval_percentage=INTEVAL_PERCENTAGE)" + ] + }, + { + "cell_type": "code", + "execution_count": 201, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "plot_changes(r_economy_k, param_name='lambda', height=4)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Extremely interesting behaviour is registered for EconomyK model: its confidence rockets with the earliness drop resulting in acceptance of almost all the predictions, however, the resulting accuracy is not as large as it is expected for such level of confidence." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### ECEC" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The definition of a common confidence threshold for different classifiers lacks of logic since the ratio of available classes and features changes along the time series length and effect the classifiers' performances. ECEC model aims to eliminate this drawback evaluating the confidence thresholds separately and automatically. \n", + "\n", + "Obtained values are stored in *confidence_thresholds* attribute after training." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from fedot_ind.core.models.early_tc import ecec as ECEC\n", + "reload(ECEC)\n", + "accuracy_importance = [0, 0.1, 0.2, 1]\n", + "r_ecec = eval_param_influence(ECEC.ECEC,\n", + " 'accuracy_importance', accuracy_importance,\n", + " prediction_mode='all', interval_percentage=INTEVAL_PERCENTAGE)" + ] + }, + { + "cell_type": "code", + "execution_count": 202, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "plot_changes(r_ecec, param_name='accuracy_importance', height=4)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Surprisingly, ECEC demonstrates very subtle sensitivity to the only tunable fitting huperparameter *accuracy_importance* which results in a flattend values in case only aerliness is considered, and downsliding dependency for other values which may be an evidence of overestimation of parameters. \n", + "\n", + "Moreover, for last subplots, the first 5 estimation points are set to (0, 0) since no objects passed over the thresholds." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## API launch" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [], + "source": [ + "from fedot.core.pipelines.pipeline_builder import PipelineBuilder\n", + "from fedot_ind.core.repository.initializer_industrial_models import IndustrialModels\n", + "from copy import deepcopy\n", + "from tqdm.autonotebook import tqdm" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let's prepare some configuration dictionaries" + ] + }, + { + "cell_type": "code", + "execution_count": 102, + "metadata": {}, + "outputs": [], + "source": [ + "series_length = train_data.features.shape[-1]\n", + "\n", + "interval_percentage = 5\n", + "consecutive_predictions = 2\n", + "transform_score = True\n", + "prediction_mode = 'all'\n", + "accuracy_importance = 0.5\n", + "common_dict = {\n", + " 'prediction_mode': prediction_mode,\n", + " 'interval_percentage': interval_percentage,\n", + " 'transform_score': transform_score,\n", + " 'accuracy_importance': accuracy_importance,\n", + "}\n", + "models = {\n", + " 'economy_k': {\n", + " 'lambda': 100000,\n", + " },\n", + " 'ecec': {},\n", + " 'teaser': {},\n", + " 'proba_threshold_etc': {\n", + " 'probability_threshold': 0.8,\n", + " },\n", + "}\n", + "for 
model in models:\n", + " models[model] |= common_dict\n", + "prediction_idx = (np.linspace(0, 1, 21) * series_length).astype(int)\n", + "earliness = 1 - prediction_idx / series_length\n", + "\n", + "results = {model: [None] * len(prediction_idx) for model in models}" + ] + }, + { + "cell_type": "code", + "execution_count": 128, + "metadata": {}, + "outputs": [], + "source": [ + "with IndustrialModels():\n", + " repo = IndustrialModels().setup_repository()\n", + " for model, params in models.items():\n", + " pipeline = PipelineBuilder().add_node(model, params=params).build()\n", + " pipeline.fit(train_data)\n", + " prediction = pipeline.predict(test_data).predict\n", + " prediction, scores = prediction\n", + " prediction = prediction.argmax(-1)\n", + " scores = scores[..., 0]\n", + " results[model] = ETSCPareto(\n", + " yte, prediction, scores, reduce=False, metric_list=('accuracy',).metric()\n", + " )\n" + ] + }, + { + "cell_type": "code", + "execution_count": 144, + "metadata": {}, + "outputs": [], + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "def plot_bicrit_metric(metrics: dict, select=None):\n", + " plt.figure(figsize=(10, 10))\n", + " for model, metric in metrics.items():\n", + " selection = metric.iloc[select, :]\n", + " sizes = ((np.arange(selection.shape[0]) * 2)[::-1]) ** 1.5 + 10\n", + " plt.plot(selection.robustness, selection.accuracy, alpha=0.3)\n", + " plt.scatter(x=selection.robustness, \n", + " y=selection.accuracy,\n", + " s=sizes, \n", + " label=model)\n", + " plt.legend(loc=\"upper right\", bbox_to_anchor=(1.5, 1))\n", + " plt.xlabel('Robustness')\n", + " plt.ylabel('Accuracy')\n", + " plt.xlim((-0.05, 1.05))\n", + " plt.ylim((-0.05, 1.05))\n", + " plt.xticks(np.linspace(0, 1, 11))\n", + " plt.yticks(np.linspace(0, 1, 11))\n", + " plt.grid(True)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 145, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "plot_bicrit_metric(results, select=slice(None, None, 2))" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": ".venv", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.4" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/fedot_ind/core/metrics/interval_metrics.py b/fedot_ind/core/metrics/interval_metrics.py index f4a5f6544..d3436cdbb 100644 --- a/fedot_ind/core/metrics/interval_metrics.py +++ b/fedot_ind/core/metrics/interval_metrics.py @@ -134,5 +134,4 @@ def nab(boundaries, predictions, mode='standard', custom_coefs=None): score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], coefs) return score - - + \ No newline at end of file diff --git a/fedot_ind/core/metrics/metrics_implementation.py b/fedot_ind/core/metrics/metrics_implementation.py index 8803f18dd..dac5e888d 100644 --- a/fedot_ind/core/metrics/metrics_implementation.py +++ b/fedot_ind/core/metrics/metrics_implementation.py @@ -222,7 +222,7 @@ def smape(a, f, _=None): (np.abs(a) + np.abs(f)) * 100) def rmse(y_true, y_pred): - return np.sqrt(mean_squared_error(y_true, y_pred)) + return mean_squared_error(y_true, y_pred, squared=False) def mape(A, F): @@ -370,15 +370,22 @@ def metric(self) -> float: if len(self.predicted_labels.shape) == 1: self.predicted_labels = self.predicted_labels[None, ...] self.predicted_probs = self.predicted_probs[None, ...] 
- + print(f''' + target shape {self.target.shape} + prediction {self.predicted_labels.shape} + predicted_probs (scores) {self.predicted_probs.shape} + ''') n_metrics = len(self.metric_list) + (self.mode == 'robust') n_est = self.predicted_labels.shape[0] result = np.zeros((n_est, n_metrics)) + print(result.shape) if self.mode == 'robust': mask = self.predicted_probs >= 0 + print('mask', mask.shape) if not mask.any(): return result robustness = mask.sum(-1) / self.predicted_probs.shape[-1] + print('rob', robustness.shape) result[:, 0] = robustness.flatten() else: mask = np.ones_like(self.predicted_probs, dtype=bool) @@ -401,6 +408,7 @@ def metric(self) -> float: self.weights /= self.weights.sum() result = result @ self.weights.T + result[np.isnan(result)] = self.default_value if not self.reduce: return pd.DataFrame(result, columns=self.columns) else: diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 9c8e12cb8..83c3a5bba 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -1,26 +1,40 @@ from typing import Optional, List -from fedot_ind.core.architecture.settings.computational import backend_methods as np +from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation +from fedot.core.operations.operation_parameters import OperationParameters from sklearn.preprocessing import StandardScaler from sklearn.base import ClassifierMixin, BaseEstimator from sktime.classification.dictionary_based import WEASEL -from fedot.core.operations.operation_parameters import OperationParameters +from fedot_ind.core.architecture.settings.computational import backend_methods as np + +class EarlyTSClassifier(ClassifierMixin, BaseEstimator): + """ + Base class for Early Time Series Classification models + which implement prefix-wise predictions via traiing multiple slave estimators. 
-class BaseETC(ClassifierMixin, BaseEstimator): - def __init__(self, params: Optional[OperationParameters] = None): - if params is None: - params = {} + Args: + ``interval_percentage (float in (1, 100])``: define how much points should be between prediction points. + ``consecutive_predictions (int)``: how many last subsequent estimators should classify object equally. + ``accuracy_importance (float in [0, 1])``: trade-off coefficient between earliness and accuracy. + ``prediction_mode (str in ['last_available', 'best_by_metrics_mean', 'all'])``: + - if 'last_available', returns the latest estimator prediction allowed by prefix length; + - if 'best_by_metrics_mean', returns the best of estimators estimated + with weighted average of accuracy and earliness + - if 'all', returns all estiamtors predictions + ``transform_score (bool)``: whether or not to scale scores to [-1, 1] interval + ``min_ts_step (int)``: minimal difference between to subsequent prefix' lengths + """ + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__() self.interval_percentage = params.get('interval_percentage', 10) self.consecutive_predictions = params.get('consecutive_predictions', 1) self.accuracy_importance = params.get('accuracy_importance', 1.) 
- - self.prediction_mode = params.get('prediction_mode', 'last_available') - self.transform_score = params.get('transform_score', True) self.min_ts_length = params.get('min_ts_step', 3) self.random_state = params.get('random_state', None) + + self.prediction_mode = params.get('prediction_mode', 'last_available') + self.transform_score = params.get('transform_score', True) self.weasel_params = {} - assert self.consecutive_predictions < self.interval_percentage, 'Not enough checkpoints for prediction proof' def _init_model(self, X, y): max_data_length = X.shape[-1] @@ -69,7 +83,7 @@ def _compute_prediction_points(self, n_idx): def _select_estimators(self, X, training=False): offset = 0 - if not training and self.prediction_mode == 'best_by_harmonic_mean': + if not training and self.prediction_mode == 'best_by_metrics_mean': estimator_indices = [self._chosen_estimator_idx] elif not training and self.prediction_mode == 'last_available': last_idx, offset = self._get_applicable_index(X.shape[-1] - 1) @@ -100,6 +114,13 @@ def _consecutive_count(self, predicted_labels: List[np.array]): return consecutive_labels # prediction_points x n_instances def predict_proba(self, *args): + """ + Args: + X (np.array): input features + Returns: + predictions as a numpy array of shape (2, n_selected_estimators, n_instances, n_classes) + where first subarray stands for probas, and second for scores + """ predicted_probas, scores, *_ = args if self.transform_score: scores = self._transform_score(scores) @@ -110,6 +131,13 @@ def predict_proba(self, *args): return prediction def predict(self, X): + """ + Args: + X (np.array): input features + Returns: + predictions as a numpy array of shape (2, n_selected_estimators, n_instances) + where first subarray stands for labels, and second for scores + """ prediction = self.predict_proba(X) labels = prediction[0:1].argmax(-1) scores = prediction[1:2, ..., 0] diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py 
index b83cc3254..64bb3f8bd 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -2,13 +2,18 @@ from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from fedot_ind.core.models.early_tc.base_early_tc import EarlyTSClassifier from sklearn.metrics import confusion_matrix from sklearn.model_selection import cross_val_predict -class ECEC(BaseETC): - def __init__(self, params: Optional[OperationParameters] = None): +class ECEC(EarlyTSClassifier): + """ + The Effective Confidence-based Early Classification algorithm + from J. Lv, X. Hu, L. Li, and P.-P. Li, “An effective confidence-based early classification + of time series,” IEEE Access, vol. 7, pp. 96 113–96 124, 2019 + """ + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self.__cv = 5 @@ -53,6 +58,7 @@ def _score(self, y, y_pred, alpha): for i, candidate in enumerate(candidates): mask = confidences >= candidate # n_pred x n_inst accuracy_for_candidate = (matches * mask).sum(1) / mask.sum(1) # n_pred + accuracy_for_candidate[np.isnan(accuracy_for_candidate)] = 0 cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) self._chosen_estimator_idx = np.argmin(cfs.mean(0)) return candidates[np.argmin(cfs, axis=0)] # n_pred diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index 481cad97b..675f87362 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -2,18 +2,22 @@ from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from fedot_ind.core.models.early_tc.base_early_tc import 
EarlyTSClassifier from sklearn.cluster import KMeans from sklearn.metrics import confusion_matrix from sklearn.model_selection import cross_val_predict -class EconomyK(BaseETC): - def __init__(self, params: Optional[OperationParameters] = None): - if params is None: - params = {} +class EconomyK(EarlyTSClassifier): + """ + Model described in + A. Dachraoui, A. Bondu, and A. Cornu´ejols, “Early classification of time series as a non myopic sequential decision + making problem,” in the European Conf. on Machine Learning and Knowledge Discovery in Databases, ser. LNCS, vol. + 9284. Springer, 2015, pp. 433–447. + """ + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self.prediction_mode = params.get('prediction_mode', 'last_available') - self.lambda_ = params.get('lambda', 1.) + self.lambda_ = params.get('lambda_', 1.) self._cluster_factor = params.get('cluster_factor' , 1) self._random_state = 2104 self.__cv = 5 @@ -81,12 +85,11 @@ def predict_proba(self, X): return super().predict_proba(probas, times) def _transform_score(self, time): - idx = self._estimator_for_predict[-1] - scores = (1 - (time - self.prediction_idx[idx]) / self.prediction_idx[-1]) # [1 / n; 1 ] - 1 / n) * n /(n - 1) * 2 - 1 - n = self.n_pred - scores -= 1 / n - scores *= n / (n - 1) * 2 + scores = 1 - (time - self.prediction_idx[self._estimator_for_predict, None]) / (self.prediction_idx[-1] - self._estimator_for_predict)[:, None] + assert ((0 <= scores) & (scores <= 1)).all() + scores *= 2 scores -= 1 + scores[np.isnan(scores)] = 0 return scores diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index b72a927f1..946d4a2c2 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -2,12 +2,14 @@ from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.architecture.settings.computational import 
backend_methods as np -from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from fedot_ind.core.models.early_tc.base_early_tc import EarlyTSClassifier -class ProbabilityThresholdClassifier(BaseETC): - def __init__(self, params: Optional[OperationParameters] = None): - if params is None: - params = {} +class ProbabilityThresholdClassifier(EarlyTSClassifier): + f""" + Two-tier Early time-series classification model + uniting consecutive prediction comparison and thresholding by predicted probability. + """ + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self.probability_threshold = params.get('probability_threshold', None) @@ -15,11 +17,18 @@ def _init_model(self, X, y): super()._init_model(X, y) if self.probability_threshold is None: self.probability_threshold = 1 / len(self.classes_[0]) + eps = 1e-7 + if self.probability_threshold == 1: + self.probability_threshold -= eps + if self.probability_threshold == 0: + self.probability_threshold += eps def predict_proba(self, X): _, predicted_probas, non_acceptance = self._predict(X, training=False) - predicted_probas[non_acceptance] = 0 scores = predicted_probas.max(-1) + scores[~non_acceptance & (scores < self.probability_threshold)] = self.probability_threshold + \ + (1 - self.probability_threshold) * self.consecutive_predictions / self.n_pred + predicted_probas[non_acceptance] = 0 return super().predict_proba(predicted_probas, scores) def _predict(self, X, training=True): diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 0350d0886..8c44c0c2e 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -2,13 +2,20 @@ from fedot.core.operations.operation_parameters import OperationParameters from fedot_ind.core.architecture.settings.computational import backend_methods as np -from fedot_ind.core.models.early_tc.base_early_tc import BaseETC +from 
fedot_ind.core.models.early_tc.base_early_tc import EarlyTSClassifier from sklearn.model_selection import GridSearchCV from sklearn.svm import OneClassSVM -class TEASER(BaseETC): - def __init__(self, params: Optional[OperationParameters] = None): +class TEASER(EarlyTSClassifier): + """ + Two-tier Early and Accurate Series classifiER + + from “TEASER: early and accurate time series classification,” + Data Min. Knowl. Discov., vol. 34, no. 5, pp. 1336–1362, 2020 + """ + + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self._oc_svm_params = (100., 10., 5., 2.5, 1.5, 1., 0.5, 0.25, 0.1) @@ -56,14 +63,27 @@ def _predict(self, X, training=False): final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # mark as accepted final_verdicts[i] = final_verdict - non_acceptance[non_acceptance & (final_verdict > 0)] = False + (non_acceptance[non_acceptance & (final_verdict > 0)], + final_verdicts[non_acceptance], + final_verdicts[~non_acceptance & (final_verdicts < 0)] + ) = False, -1, self.consecutive_predictions / self.n_pred return predicted_labels, predicted_probas, non_acceptance, final_verdicts def predict_proba(self, X): _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) - predicted_probas[non_acceptance] = final_verdicts[non_acceptance, None] + predicted_probas[non_acceptance] = 0 #final_verdicts[non_acceptance, None] return super().predict_proba(predicted_probas, final_verdicts) + def predict(self, X): + prediction = self.predict_proba(X) + labels = prediction[0:1].argmax(-1) + scores = prediction[1:2, ..., 0] + labels[scores < 0] = -1 + prediction = np.stack([labels, scores], 0) + if prediction.shape[1] == 1: + prediction = prediction.squeeze(1) + return prediction + def _score(self, X, y, accuracy_importance=None): scores = super()._score(X, y, accuracy_importance) self._chosen_estimator_idx = np.argmax(scores) diff --git a/fedot_ind/core/models/nn/network_impl/base_nn_model.py 
b/fedot_ind/core/models/nn/network_impl/base_nn_model.py index f285853d0..7c20f5f0b 100644 --- a/fedot_ind/core/models/nn/network_impl/base_nn_model.py +++ b/fedot_ind/core/models/nn/network_impl/base_nn_model.py @@ -122,8 +122,11 @@ def _train_one_batch(self, batch, optimizer, loss_fn): optimizer.step() training_loss = loss.data.item() * inputs.size(0) total = targets.size(0) - correct = (torch.argmax(output, 1) == - torch.argmax(targets, 1)).sum().item() + if targets.ndim == 2: + targets = targets.argmax(-1) + if output.ndim == 2: + output = output.argmax(-1) + correct = (output == targets).sum().item() return training_loss, total, correct def _eval_one_batch(self, batch, loss_fn): @@ -132,8 +135,11 @@ def _eval_one_batch(self, batch, loss_fn): loss = loss_fn(output, targets.float()) valid_loss = loss.data.item() * inputs.size(0) total = targets.size(0) - correct = (torch.argmax(output, 1) == - torch.argmax(targets, 1)).sum().item() + if targets.ndim == 2: + targets = targets.argmax(-1) + if output.ndim == 2: + output = output.argmax(-1) + correct = (output == targets).sum().item() return valid_loss, total, correct def _run_one_epoch(self, train_loader, val_loader, @@ -188,7 +194,6 @@ def _train_loop(self, train_loader, val_loader, loss_fn, optimizer): best_val_loss = float('inf') val_interval = self.get_validation_frequency( self.epochs, self.learning_rate) - loss_prefix = 'RMSE' if self.is_regression_task else 'Accuracy' for epoch in range(1, self.epochs + 1): best_model, best_val_loss = self._run_one_epoch( train_loader, val_loader, diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 604f28660..33cf7e23e 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -1,20 +1,14 @@ -import copy from fedot_ind.core.models.nn.network_impl.base_nn_model import BaseNeuralModel -from typing import Optional, Callable, Any, List, Union +from typing 
import Optional from fedot.core.operations.operation_parameters import OperationParameters -from fedot.core.data.data import InputData, OutputData -from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY, MULTI_CLASS_CROSS_ENTROPY, RMSE +from fedot.core.data.data import InputData +from fedot_ind.core.repository.constanst_repository import CROSS_ENTROPY import torch.optim as optim -import torch.optim.lr_scheduler as lr_scheduler import torch.nn as nn import torch.nn.functional as F import torch -from tqdm import tqdm from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array -import pandas as pd -from fedot_ind.core.models.nn.network_modules.layers.special import adjust_learning_rate, EarlyStopping -import torch.utils.data as data class SqueezeExciteBlock(nn.Module): def __init__(self, input_channels, filters, reduce=4): @@ -44,7 +38,7 @@ def __init__(self, input_size, input_channels, self.lstm = nn.LSTM(input_size, inner_size, num_layers, batch_first=True, dropout=dropout) - squeeze_excite_size = input_size #if not interval else interval + squeeze_excite_size = input_size self.conv_branch = nn.Sequential( nn.Conv1d(input_channels, inner_channels, padding='same', @@ -82,10 +76,15 @@ def forward(self, x, hidden_state=None, return_hidden=False): class MLSTM(BaseNeuralModel): - def __init__(self, params: Optional[OperationParameters] = None): - if params is None: - params = {} - super().__init__() + f""" + The Multivariate Long Short Term Memory Fully Convolutional Network (MLSTM) + from F. Karim, S. Majumdar, H. Darabi, and S. Harford, “Multivariate LSTM-FCNs for time series classification,” Neural + Networks, vol. 116, pp. 237–245, 2019. 
+ + {BaseNeuralModel.__doc__} + """ + def __init__(self, params: Optional[OperationParameters] = {}): + super().__init__(params) self.dropout = params.get('dropout', 0.25) self.hidden_size = params.get('hidden_size', 64) self.hidden_channels = params.get('hidden_channels', 32) @@ -101,7 +100,7 @@ def __repr__(self): def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) prediction_idx = np.arange(interval_length - 1, n_idx, interval_length) - self.earliness = 1 - prediction_idx / n_idx # /n_idx because else the last hm score is always 0 + self.earliness = 1 - prediction_idx / n_idx return prediction_idx, interval_length def _init_model(self, ts: InputData): @@ -198,6 +197,7 @@ def _predict_model(self, x_test: InputData, output_mode: str = 'default'): pred = self._moving_window_output(torch.tensor(x_test).float()) else: raise ValueError('Unknown prediction mode') + pred = pred.detach() return self._convert_predict(pred, output_mode) def _padding(self, ts: np.array): diff --git a/fedot_ind/core/models/nn/network_impl/transformer.py b/fedot_ind/core/models/nn/network_impl/transformer.py index a8d12fdd8..07d049a33 100644 --- a/fedot_ind/core/models/nn/network_impl/transformer.py +++ b/fedot_ind/core/models/nn/network_impl/transformer.py @@ -72,6 +72,8 @@ class TransformerModel(BaseNeuralModel): self.batch_size: int, the batch size. 
""" + def __repr__(self): + return 'Transformer' def __init__(self, params: Optional[OperationParameters] = None): super().__init__(params) diff --git a/fedot_ind/core/models/quantile/quantile_extractor.py b/fedot_ind/core/models/quantile/quantile_extractor.py index 17a44e0cd..35fd99857 100644 --- a/fedot_ind/core/models/quantile/quantile_extractor.py +++ b/fedot_ind/core/models/quantile/quantile_extractor.py @@ -87,4 +87,4 @@ def generate_features_from_ts(self, aggregation_df = self._get_feature_matrix( self.extract_stats_features, ts) - return aggregation_df + return aggregation_df \ No newline at end of file diff --git a/fedot_ind/core/repository/data/industrial_model_repository.json b/fedot_ind/core/repository/data/industrial_model_repository.json index b05cb3c95..a7bddecf5 100644 --- a/fedot_ind/core/repository/data/industrial_model_repository.json +++ b/fedot_ind/core/repository/data/industrial_model_repository.json @@ -372,9 +372,9 @@ }, "mlstm_model": { "meta": "fedot_NN_classification", - "presets": ["ts"], + "presets": [], "tags": [], - "input_type": "[DataTypesEnum.table]" + "input_type": "[DataTypesEnum.multi_ts, DataTypesEnum.ts]" }, "xcm_model": { "meta": "fedot_NN_classification", diff --git a/tests/unit/core/models/model_impl/test_mlstm.py b/tests/unit/core/models/model_impl/test_mlstm.py new file mode 100644 index 000000000..d245e6dbd --- /dev/null +++ b/tests/unit/core/models/model_impl/test_mlstm.py @@ -0,0 +1,37 @@ +import pytest + +from fedot.core.data.data import InputData +from fedot_ind.core.models.nn.network_impl.mlstm import MLSTM +from fedot.core.pipelines.pipeline_builder import PipelineBuilder +from fedot_ind.core.repository.initializer_industrial_models import IndustrialModels +from fedot.core.repository.dataset_types import DataTypesEnum +from fedot.core.repository.tasks import Task, TaskTypesEnum +import numpy as np + + +_N_FEATURES = 73 +_N_SAMPLES = 133 +_N_CLASSES = 3 +_INTERVAL_LENGTH = 7 + +@pytest.fixture +def data(): + X, y = 
np.random.randn(_N_SAMPLES, _N_FEATURES), np.random.randint(0, _N_CLASSES, size=_N_SAMPLES) + return InputData(idx=np.arange(0, len(X)), + features=X, + target=y, + task=Task(TaskTypesEnum.classification), + data_type=DataTypesEnum.table) + +@pytest.mark.parametrize('fitting_mode', ['zero_padding', 'moving_window']) +def test_mlstm_by_mode(data, fitting_mode): + with IndustrialModels(): + ppl = PipelineBuilder().add_node('mlstm_model', + params={'epochs': 5, 'fitting_mode': fitting_mode}).build() + ppl.fit(data) + pred = ppl.predict(data).predict + assert not np.isnan(pred).any() + + + + diff --git a/tests/unit/core/models/test_etc.py b/tests/unit/core/models/test_etc.py new file mode 100644 index 000000000..b1ff2e3de --- /dev/null +++ b/tests/unit/core/models/test_etc.py @@ -0,0 +1,98 @@ +import pytest + +from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier +from fedot_ind.core.models.early_tc.ecec import ECEC +from fedot_ind.core.models.early_tc.economy_k import EconomyK +from fedot_ind.core.models.early_tc.teaser import TEASER +import numpy as np + +_N_FEATURES = 73 +_N_SAMPLES = 133 +_N_CLASSES = 3 +_INTERVAL_LENGTH = 7 +MODELS = { + 'economy_k': EconomyK, + 'ecec': ECEC, + 'teaser': TEASER, + 'proba_threshold_etc': ProbabilityThresholdClassifier +} + +@pytest.fixture +def data(): + X, y = np.random.randn(_N_SAMPLES, _N_FEATURES), np.random.randint(0, _N_CLASSES, size=_N_SAMPLES) + return X, y + +def test_compute_prediction_points(data): + X, y = data + pthr = ProbabilityThresholdClassifier({'interval_percentage': 10}) + pthr._init_model(X, y) + prediction_idx = pthr.prediction_idx + assert len(prediction_idx) == _N_FEATURES // _INTERVAL_LENGTH, 'wrong number of points' + +@pytest.mark.parametrize('training,prediction_mode,expected_num', [ + (True, 'last_available', None), + (False, 'last_available', 1), + (False, 'best_by_metrics_mean', 1), + (False, 'all', None), + +]) +def test_select_estimators(data, training, 
prediction_mode, expected_num): + X, y = data + pthr = ProbabilityThresholdClassifier({'prediction_mode': prediction_mode}) + pthr._init_model(X, y) + if expected_num is None: + expected_num = pthr.n_pred + idx, _ = pthr._select_estimators(X, training) + assert len(idx) == expected_num, f'selection went wrong: got {len(idx)}, expected {expected_num}' + +@pytest.mark.parametrize('model', + ['proba_threshold_etc', 'ecec', 'economy_k', 'teaser']) +def test_fit_predict(data, model): + X, y = data + model = MODELS[model]({'prediction_mode': 'all'}) + model.fit(X, y) + prediction = model.predict_proba(X) + ind = model._select_estimators(X, training=False)[0] + assert (not np.isnan(prediction).any() and + (prediction.shape == (2, len(ind), len(y), _N_CLASSES))), 'Prediction went wrong' + +# ECEC TESTS +def test_select_thrs(): + model = ECEC() + selection = model._select_thrs(np.random.randn(40)) + assert len(selection), 'No candidates were chosen!' + +# Proba Thr +def test_consecutive(data): + X, y = data + pthr = ProbabilityThresholdClassifier({'prediction_mode': 'last_available', + 'consecutive_predictions': 1}) + pthr.fit(X, y) + prediction, scores = pthr.predict(X) + assert -1 not in prediction, 'Setting uncertainty while it is impossible' + +# Economy K +def test_specific_economyk(data): + X, y = data + model = EconomyK() + model.fit(X, y) + assert not np.isnan( + model._EconomyK__cluster_probas(X, model._clusterizer.cluster_centers_) + ).any(), '__cluster_probas doesn\'t function correctly' + + i = model.n_pred - 1 + times = model._get_prediction_time(X, model._clusterizer.cluster_centers_, i)[0] + assert not np.isnan(times).any() + assert ((model.prediction_idx[0] <= times) & (times <= model.prediction_idx[-1])).all(), \ + f'(_get_prediction_time) case of the last prediction point:' + \ + ' times cannot exceed the limits of time predictions.' 
+ \ + f'current lies in [{times.min()}, {times.max()}]' + +# TEASER +def test_form_X_oc(): + probas = np.random.randint(0, 10, size=(_N_SAMPLES, _N_CLASSES)).astype(float) + probas /= probas.sum(1, keepdims=True) + 1e-5 + model = TEASER() + X_oc = model._form_X_oc(probas) + assert X_oc.shape == (_N_SAMPLES, _N_CLASSES + 1), 'Wrong number of features' + assert ((0 <= X_oc) & (X_oc <= 1)).all(), 'In original paper outputs lie in [0, 1]' From 3d9022c9da4fcba5d1006b16982ca6fd1a6455c6 Mon Sep 17 00:00:00 2001 From: autopep8 bot Date: Tue, 23 Jul 2024 09:41:01 +0000 Subject: [PATCH 39/43] Automated autopep8 fixes --- .../core/models/early_tc/base_early_tc.py | 10 +++--- fedot_ind/core/models/early_tc/ecec.py | 3 +- fedot_ind/core/models/early_tc/economy_k.py | 12 ++++--- .../core/models/early_tc/prob_threshold.py | 8 +++-- fedot_ind/core/models/early_tc/teaser.py | 14 ++++---- .../core/models/nn/network_impl/mlstm.py | 12 ++++--- .../models/nn/network_impl/transformer.py | 1 + .../models/quantile/quantile_extractor.py | 2 +- .../unit/core/models/model_impl/test_mlstm.py | 17 ++++------ tests/unit/core/models/test_etc.py | 34 +++++++++++++------ 10 files changed, 65 insertions(+), 48 deletions(-) diff --git a/fedot_ind/core/models/early_tc/base_early_tc.py b/fedot_ind/core/models/early_tc/base_early_tc.py index 09f24c462..bb5c9d89d 100644 --- a/fedot_ind/core/models/early_tc/base_early_tc.py +++ b/fedot_ind/core/models/early_tc/base_early_tc.py @@ -1,5 +1,4 @@ from typing import Optional, List -from fedot.core.operations.evaluation.operation_implementations.implementation_interfaces import ModelImplementation from fedot.core.operations.operation_parameters import OperationParameters from sklearn.preprocessing import StandardScaler from sklearn.base import ClassifierMixin, BaseEstimator @@ -9,7 +8,7 @@ class EarlyTSClassifier(ClassifierMixin, BaseEstimator): """ - Base class for Early Time Series Classification models + Base class for Early Time Series Classification 
models which implement prefix-wise predictions via traiing multiple slave estimators. Args: @@ -24,14 +23,15 @@ class EarlyTSClassifier(ClassifierMixin, BaseEstimator): ``transform_score (bool)``: whether or not to scale scores to [-1, 1] interval ``min_ts_step (int)``: minimal difference between to subsequent prefix' lengths """ - def __init__(self, params: Optional[OperationParameters] = {}): + + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__() self.interval_percentage = params.get('interval_percentage', 10) self.consecutive_predictions = params.get('consecutive_predictions', 1) self.accuracy_importance = params.get('accuracy_importance', 1.) self.min_ts_length = params.get('min_ts_step', 3) self.random_state = params.get('random_state', None) - + self.prediction_mode = params.get('prediction_mode', 'last_available') self.transform_score = params.get('transform_score', True) self.weasel_params = {} @@ -123,7 +123,7 @@ def predict_proba(self, *args): predictions as a numpy array of shape (2, n_selected_estimators, n_instances, n_classes) where first subarray stands for probas, and second for scores """ - predicted_probas, scores, *_ = args + predicted_probas, scores, *_ = args if self.transform_score: scores = self._transform_score(scores) scores = np.tile(scores[..., None], (1, 1, self.n_classes)) diff --git a/fedot_ind/core/models/early_tc/ecec.py b/fedot_ind/core/models/early_tc/ecec.py index b8a743f25..4137faa70 100644 --- a/fedot_ind/core/models/early_tc/ecec.py +++ b/fedot_ind/core/models/early_tc/ecec.py @@ -13,6 +13,7 @@ class ECEC(EarlyTSClassifier): from J. Lv, X. Hu, L. Li, and P.-P. Li, “An effective confidence-based early classification of time series,” IEEE Access, vol. 7, pp. 
96 113–96 124, 2019 """ + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self.__cv = 5 @@ -57,7 +58,7 @@ def _score(self, y, y_pred, alpha): cfs = np.zeros((len(candidates), n)) for i, candidate in enumerate(candidates): mask = confidences >= candidate # n_pred x n_inst - accuracy_for_candidate = (matches * mask).sum(1) / mask.sum(1) # n_pred + accuracy_for_candidate = (matches * mask).sum(1) / mask.sum(1) # n_pred accuracy_for_candidate[np.isnan(accuracy_for_candidate)] = 0 cfs[i] = self.cost_func(self.earliness, accuracy_for_candidate, alpha) self._chosen_estimator_idx = np.argmin(cfs.mean(0)) diff --git a/fedot_ind/core/models/early_tc/economy_k.py b/fedot_ind/core/models/early_tc/economy_k.py index e41d393cf..a67d3b945 100644 --- a/fedot_ind/core/models/early_tc/economy_k.py +++ b/fedot_ind/core/models/early_tc/economy_k.py @@ -10,16 +10,17 @@ class EconomyK(EarlyTSClassifier): """ - Model described in - A. Dachraoui, A. Bondu, and A. Cornu´ejols, “Early classification of time series as a non myopic sequential decision + Model described in + A. Dachraoui, A. Bondu, and A. Cornu´ejols, “Early classification of time series as a non myopic sequential decision making problem,” in the European Conf. on Machine Learning and Knowledge Discovery in Databases, ser. LNCS, vol. 9284. Springer, 2015, pp. 433–447. """ - def __init__(self, params: Optional[OperationParameters] = {}): + + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self.prediction_mode = params.get('prediction_mode', 'last_available') self.lambda_ = params.get('lambda_', 1.) 
- self._cluster_factor = params.get('cluster_factor' , 1) + self._cluster_factor = params.get('cluster_factor', 1) self._random_state = 2104 self.__cv = 5 @@ -88,7 +89,8 @@ def predict_proba(self, X): return super().predict_proba(probas, times) def _transform_score(self, time): - scores = 1 - (time - self.prediction_idx[self._estimator_for_predict, None]) / (self.prediction_idx[-1] - self._estimator_for_predict)[:, None] + scores = 1 - (time - self.prediction_idx[self._estimator_for_predict, None] + ) / (self.prediction_idx[-1] - self._estimator_for_predict)[:, None] assert ((0 <= scores) & (scores <= 1)).all() scores *= 2 scores -= 1 diff --git a/fedot_ind/core/models/early_tc/prob_threshold.py b/fedot_ind/core/models/early_tc/prob_threshold.py index 537bd963e..bbf77b49b 100644 --- a/fedot_ind/core/models/early_tc/prob_threshold.py +++ b/fedot_ind/core/models/early_tc/prob_threshold.py @@ -4,12 +4,14 @@ from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.models.early_tc.base_early_tc import EarlyTSClassifier + class ProbabilityThresholdClassifier(EarlyTSClassifier): f""" - Two-tier Early time-series classification model + Two-tier Early time-series classification model uniting consecutive prediction comparison and thresholding by predicted probability. 
""" - def __init__(self, params: Optional[OperationParameters] = {}): + + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self.probability_threshold = params.get('probability_threshold', None) @@ -22,7 +24,7 @@ def _init_model(self, X, y): self.probability_threshold -= eps if self.probability_threshold == 0: self.probability_threshold += eps - + def predict_proba(self, X): _, predicted_probas, non_acceptance = self._predict(X, training=False) scores = predicted_probas.max(-1) diff --git a/fedot_ind/core/models/early_tc/teaser.py b/fedot_ind/core/models/early_tc/teaser.py index 5dd4ff437..475e8f33f 100644 --- a/fedot_ind/core/models/early_tc/teaser.py +++ b/fedot_ind/core/models/early_tc/teaser.py @@ -14,8 +14,8 @@ class TEASER(EarlyTSClassifier): from “TEASER: early and accurate time series classification,” Data Min. Knowl. Discov., vol. 34, no. 5, pp. 1336–1362, 2020 """ - - def __init__(self, params: Optional[OperationParameters] = {}): + + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self._oc_svm_params = (100., 10., 5., 2.5, 1.5, 1., 0.5, 0.25, 0.1) @@ -62,16 +62,16 @@ def _predict(self, X, training=False): # if they are not outliers final_verdict = self.oc_estimators[estimator_indices[i]].decision_function(X_to_ith) # mark as accepted - final_verdicts[i] = final_verdict - (non_acceptance[non_acceptance & (final_verdict > 0)], - final_verdicts[non_acceptance], + final_verdicts[i] = final_verdict + (non_acceptance[non_acceptance & (final_verdict > 0)], + final_verdicts[non_acceptance], final_verdicts[~non_acceptance & (final_verdicts < 0)] - ) = False, -1, self.consecutive_predictions / self.n_pred + ) = False, -1, self.consecutive_predictions / self.n_pred return predicted_labels, predicted_probas, non_acceptance, final_verdicts def predict_proba(self, X): _, predicted_probas, non_acceptance, final_verdicts = self._predict(X) - predicted_probas[non_acceptance] = 0 
#final_verdicts[non_acceptance, None] + predicted_probas[non_acceptance] = 0 # final_verdicts[non_acceptance, None] return super().predict_proba(predicted_probas, final_verdicts) def _score(self, X, y, accuracy_importance=None): diff --git a/fedot_ind/core/models/nn/network_impl/mlstm.py b/fedot_ind/core/models/nn/network_impl/mlstm.py index 2d9d99396..bc6b1e825 100644 --- a/fedot_ind/core/models/nn/network_impl/mlstm.py +++ b/fedot_ind/core/models/nn/network_impl/mlstm.py @@ -10,6 +10,7 @@ from fedot_ind.core.architecture.settings.computational import backend_methods as np from fedot_ind.core.architecture.abstraction.decorators import convert_to_3d_torch_array + class SqueezeExciteBlock(nn.Module): def __init__(self, input_channels, filters, reduce=4): super().__init__() @@ -37,9 +38,9 @@ def __init__(self, input_size, input_channels, super().__init__() self.proj = nn.Linear(input_size * inner_channels + input_channels * inner_size, output_size) self.lstm = nn.LSTM(input_size, inner_size, num_layers, - batch_first=True, dropout=dropout) - - squeeze_excite_size = input_size + batch_first=True, dropout=dropout) + + squeeze_excite_size = input_size self.conv_branch = nn.Sequential( nn.Conv1d(input_channels, inner_channels, padding='same', @@ -84,7 +85,8 @@ class MLSTM(BaseNeuralModel): {BaseNeuralModel.__doc__} """ - def __init__(self, params: Optional[OperationParameters] = {}): + + def __init__(self, params: Optional[OperationParameters] = {}): super().__init__(params) self.dropout = params.get('dropout', 0.25) self.hidden_size = params.get('hidden_size', 64) @@ -101,7 +103,7 @@ def __repr__(self): def _compute_prediction_points(self, n_idx): interval_length = max(int(n_idx * self.interval_percentage / 100), self.min_ts_length) prediction_idx = np.arange(interval_length - 1, n_idx, interval_length) - self.earliness = 1 - prediction_idx / n_idx + self.earliness = 1 - prediction_idx / n_idx return prediction_idx, interval_length def _init_model(self, ts: InputData): 
diff --git a/fedot_ind/core/models/nn/network_impl/transformer.py b/fedot_ind/core/models/nn/network_impl/transformer.py index 07d049a33..11dd54b09 100644 --- a/fedot_ind/core/models/nn/network_impl/transformer.py +++ b/fedot_ind/core/models/nn/network_impl/transformer.py @@ -72,6 +72,7 @@ class TransformerModel(BaseNeuralModel): self.batch_size: int, the batch size. """ + def __repr__(self): return 'Transformer' diff --git a/fedot_ind/core/models/quantile/quantile_extractor.py b/fedot_ind/core/models/quantile/quantile_extractor.py index 0d92127b6..596f165d6 100644 --- a/fedot_ind/core/models/quantile/quantile_extractor.py +++ b/fedot_ind/core/models/quantile/quantile_extractor.py @@ -90,4 +90,4 @@ def generate_features_from_ts(self, aggregation_df = self._get_feature_matrix( self.extract_stats_features, ts) - return aggregation_df \ No newline at end of file + return aggregation_df diff --git a/tests/unit/core/models/model_impl/test_mlstm.py b/tests/unit/core/models/model_impl/test_mlstm.py index d245e6dbd..be7fcc0ec 100644 --- a/tests/unit/core/models/model_impl/test_mlstm.py +++ b/tests/unit/core/models/model_impl/test_mlstm.py @@ -1,7 +1,6 @@ import pytest from fedot.core.data.data import InputData -from fedot_ind.core.models.nn.network_impl.mlstm import MLSTM from fedot.core.pipelines.pipeline_builder import PipelineBuilder from fedot_ind.core.repository.initializer_industrial_models import IndustrialModels from fedot.core.repository.dataset_types import DataTypesEnum @@ -14,24 +13,22 @@ _N_CLASSES = 3 _INTERVAL_LENGTH = 7 + @pytest.fixture def data(): X, y = np.random.randn(_N_SAMPLES, _N_FEATURES), np.random.randint(0, _N_CLASSES, size=_N_SAMPLES) return InputData(idx=np.arange(0, len(X)), - features=X, - target=y, - task=Task(TaskTypesEnum.classification), - data_type=DataTypesEnum.table) + features=X, + target=y, + task=Task(TaskTypesEnum.classification), + data_type=DataTypesEnum.table) + @pytest.mark.parametrize('fitting_mode', ['zero_padding', 
'moving_window']) def test_mlstm_by_mode(data, fitting_mode): with IndustrialModels(): - ppl = PipelineBuilder().add_node('mlstm_model', + ppl = PipelineBuilder().add_node('mlstm_model', params={'epochs': 5, 'fitting_mode': fitting_mode}).build() ppl.fit(data) pred = ppl.predict(data).predict assert not np.isnan(pred).any() - - - - diff --git a/tests/unit/core/models/test_etc.py b/tests/unit/core/models/test_etc.py index b1ff2e3de..e8b0647eb 100644 --- a/tests/unit/core/models/test_etc.py +++ b/tests/unit/core/models/test_etc.py @@ -17,11 +17,13 @@ 'proba_threshold_etc': ProbabilityThresholdClassifier } + @pytest.fixture def data(): X, y = np.random.randn(_N_SAMPLES, _N_FEATURES), np.random.randint(0, _N_CLASSES, size=_N_SAMPLES) return X, y + def test_compute_prediction_points(data): X, y = data pthr = ProbabilityThresholdClassifier({'interval_percentage': 10}) @@ -29,12 +31,13 @@ def test_compute_prediction_points(data): prediction_idx = pthr.prediction_idx assert len(prediction_idx) == _N_FEATURES // _INTERVAL_LENGTH, 'wrong number of points' + @pytest.mark.parametrize('training,prediction_mode,expected_num', [ (True, 'last_available', None), - (False, 'last_available', 1), + (False, 'last_available', 1), (False, 'best_by_metrics_mean', 1), (False, 'all', None), - + ]) def test_select_estimators(data, training, prediction_mode, expected_num): X, y = data @@ -45,24 +48,29 @@ def test_select_estimators(data, training, prediction_mode, expected_num): idx, _ = pthr._select_estimators(X, training) assert len(idx) == expected_num, f'selection went wrong: got {len(idx)}, expected {expected_num}' -@pytest.mark.parametrize('model', - ['proba_threshold_etc', 'ecec', 'economy_k', 'teaser']) + +@pytest.mark.parametrize('model', + ['proba_threshold_etc', 'ecec', 'economy_k', 'teaser']) def test_fit_predict(data, model): X, y = data model = MODELS[model]({'prediction_mode': 'all'}) model.fit(X, y) prediction = model.predict_proba(X) ind = model._select_estimators(X, 
training=False)[0] - assert (not np.isnan(prediction).any() and + assert (not np.isnan(prediction).any() and (prediction.shape == (2, len(ind), len(y), _N_CLASSES))), 'Prediction went wrong' - + # ECEC TESTS + + def test_select_thrs(): model = ECEC() selection = model._select_thrs(np.random.randn(40)) assert len(selection), 'No candidates were chosen!' # Proba Thr + + def test_consecutive(data): X, y = data pthr = ProbabilityThresholdClassifier({'prediction_mode': 'last_available', @@ -72,23 +80,27 @@ def test_consecutive(data): assert -1 not in prediction, 'Setting uncertainty while it is impossible' # Economy K + + def test_specific_economyk(data): X, y = data model = EconomyK() model.fit(X, y) assert not np.isnan( model._EconomyK__cluster_probas(X, model._clusterizer.cluster_centers_) - ).any(), '__cluster_probas doesn\'t function correctly' - + ).any(), '__cluster_probas doesn\'t function correctly' + i = model.n_pred - 1 times = model._get_prediction_time(X, model._clusterizer.cluster_centers_, i)[0] assert not np.isnan(times).any() assert ((model.prediction_idx[0] <= times) & (times <= model.prediction_idx[-1])).all(), \ f'(_get_prediction_time) case of the last prediction point:' + \ - ' times cannot exceed the limits of time predictions.' + \ - f'current lies in [{times.min()}, {times.max()}]' - + ' times cannot exceed the limits of time predictions.' 
+ \ + f'current lies in [{times.min()}, {times.max()}]' + # TEASER + + def test_form_X_oc(): probas = np.random.randint(0, 10, size=(_N_SAMPLES, _N_CLASSES)).astype(float) probas /= probas.sum(1, keepdims=True) + 1e-5 From e68331c4361adb119eb30f4955e39568f630d606 Mon Sep 17 00:00:00 2001 From: Leon_Strelkov <103892559+leostre@users.noreply.github.com> Date: Thu, 25 Jul 2024 12:24:09 +0300 Subject: [PATCH 40/43] Delete tests/unit/core/models/test_teaser.py due to its inclusion into test_etc.py --- tests/unit/core/models/test_teaser.py | 36 --------------------------- 1 file changed, 36 deletions(-) delete mode 100644 tests/unit/core/models/test_teaser.py diff --git a/tests/unit/core/models/test_teaser.py b/tests/unit/core/models/test_teaser.py deleted file mode 100644 index 1cf847f67..000000000 --- a/tests/unit/core/models/test_teaser.py +++ /dev/null @@ -1,36 +0,0 @@ -import pytest -import numpy as np -from fedot_ind.core.models.early_tc import teaser as TEASER - - -@pytest.fixture(scope='module') -def teaser(): - teaser = TEASER.TEASER({'interval_length': 10, 'prediction_mode': ''}) - return teaser - - -@pytest.fixture(scope='module') -def xy(): - return np.random.randn((2, 23)), np.random.randint(0, 2, size=(2, 1)) - - -def test_get_applicable_index(teaser): - teaser._init_model(23) - idx, offset = teaser._get_last_applicable_idx(100) - assert offset == 100 - 22, 'Wrong offset estimation when right edge' - assert idx == len(teaser.prediction_idx) - 1 - idx, offset = teaser._get_last_applicable_idx(12) - assert offset == 100 - teaser.prediction_idx[idx], 'Wrong offset estimation in the middle' - assert idx == len(teaser.prediction_idx) - 1 - - -def test_compute_prediction_points(teaser): - indices = teaser._compute_prediction_points(23) - assert 2 in indices - assert 22 in indices - assert 23 not in indices - -# def test_consecutive_count(teaser): -# pass - -# def test_score(teaser): From b50e8b133b07f498fd4784208d4fcf1340190c81 Mon Sep 17 00:00:00 2001 From: 
Leon_Strelkov <103892559+leostre@users.noreply.github.com> Date: Thu, 25 Jul 2024 12:46:22 +0300 Subject: [PATCH 41/43] Delete fedot_ind/core/metrics/interval_metrics.py due to the fucntionality overlap --- fedot_ind/core/metrics/interval_metrics.py | 142 --------------------- 1 file changed, 142 deletions(-) delete mode 100644 fedot_ind/core/metrics/interval_metrics.py diff --git a/fedot_ind/core/metrics/interval_metrics.py b/fedot_ind/core/metrics/interval_metrics.py deleted file mode 100644 index f95586147..000000000 --- a/fedot_ind/core/metrics/interval_metrics.py +++ /dev/null @@ -1,142 +0,0 @@ -from sklearn.metrics import confusion_matrix -import numpy as np -import pandas as pd -from typing import Union, Literal - - -def conf_matrix(actual, predicted): - cm = confusion_matrix(actual, predicted) - return dict(TN=cm[0, 0], FP=cm[0, 1], FN=cm[1, 0], TP=[1, 1]) - - -def average_delay(boundaries, prediction, - point, - use_idx=True, - window_placement='lefter'): - cp_confusion = extract_cp_cm(boundaries, prediction, use_idx=use_idx, use_switch_point=False) - # statistics - statistics = { - 'anomalies_num': len(cp_confusion['TPs']) + len(cp_confusion['FPs']), - 'FP_num': len(cp_confusion['FPs']), - 'missed': len(cp_confusion['FNs']) - } - time_func = { - 'righter': lambda triplet: triplet[1] - triplet[0], - 'lefter': lambda triplet: triplet[2] - triplet[1], - 'central': lambda triplet: triplet[1] - triplet[0] - (triplet[2] - triplet[0]) / 2 - }[window_placement] - - detection_history = { - i: time_func(triplet) for i, triplet in cp_confusion['TPs'].items() - } - return detection_history, statistics - - -def tp_transform(tps): - return np.diff(tps[[1, 0]], axis=0) / np.diff(tps[[-1, 0]], axis=0) - - -def extract_cp_cm(boundaries: Union[np.array, pd.DataFrame], - prediction: pd.DataFrame, - use_switch_point: bool = True, # if first anomaly dot is considered as changepoint - use_idx: bool = False): - if isinstance(boundaries, pd.DataFrame): - boundaries = 
boundaries.values.T - anomaly_tsp = prediction[prediction == 1].sort_index().index - TPs, FNs, FPs = {}, [], [] - - if boundaries.shape[1]: - - FPs += [anomaly_tsp[anomaly_tsp < boundaries[0, 0]]] # left rest - for i, (b_low, b_up) in enumerate(boundaries): - all_tsp_in_window = prediction[b_low: b_up].index - anomaly_tsp_in_window = anomaly_tsp_in_window & anomaly_tsp - if not len(anomaly_tsp_in_window): # why not false positive? do we expect an anomaly to be in every interval? - FNs.append(i if use_idx else all_tsp_in_window) - TPs[i] = [b_low, - anomaly_tsp_in_window[int(use_switch_point)] if use_idx else anomaly_tsp_in_window, - b_up] - if not use_idx: - FNs.append(all_tsp_in_window - anomaly_tsp_in_window) - FPs.append(anomaly_tsp[anomaly_tsp > boundaries[-1, -1]]) # right rest - else: - FPs.append(anomaly_tsp) - - FPs = np.concatenate(FPs) - FNs = np.concatenate(FNs) - - return dict( - FP=FPs, - FN=FNs, - TP=np.stack(TPs) - ) - -# cognate of single_detecting_boundaries - - -def get_boundaries(idx, actual_timestamps, window_size: int = None, - window_placement: Literal['left', 'right', 'central'] = 'left', - intersection_mode: Literal['uniform', 'shift_to_left', 'shift_to_right'] = 'shift_to_left', - ): - # idx = idx - # cast everything to pandas object fir the subsequent comfort - if isinstance(idx, np.array): - if idx.dtype == np.dtype('O'): - idx = pd.to_datetime(pd.Series(idx)) - td = pd.Timedelta(window_size) - else: - idx = pd.Series(idx) - td = window_size - else: - raise TypeError('Unexpected type of ts index') - - boundaries = np.tile(actual_timestamps, (2, 1)) - # [0, ...] - lower bound, [1, ...] 
- upper - if window_placement == 'left': - boundaries[0] -= td - elif window_placement == 'central': - boundaries[0] -= td / 2 - boundaries[1] += td / 2 - elif window_placement == 'right': - boundaries[1] += td - else: - raise ValueError('Unknown mode') - - if not len(actual_timestamps): - return boundaries - - # intersection resolution - for i in range(len(actual_timestamps) - 1): - if not boundaries[0, i + 1] > boundaries[1, i]: - continue - - if intersection_mode == 'shift_to_left': - boundaries[0, i + 1] = boundaries[1, i] - elif intersection_mode == 'shift_to_right': - boundaries[1, i] = boundaries[0, i + 1] - elif intersection_mode == 'uniform': - boundaries[1, i], boundaries[0, i + 1] = boundaries[0, i + 1], boundaries[1, i] - else: - raise ValueError('Unknown intersection resolution') - - # filtering - idx_to_keep = np.abs(np.diff(boundaries, axis=0)) > 1e-6 - boundaries = boundaries[..., idx_to_keep] - boundaries = pd.DataFrame({'lower': boundaries[0], 'upper': boundaries[1]}) - return boundaries - - -def nab(boundaries, predictions, mode='standard', custom_coefs=None): - inner_coefs = { - 'low_FP': [1.0, -0.11, -1.0], - 'standard': [1., -0.22, -1.], - 'lof_FN': [1., -0.11, -2.] 
- } - coefs = custom_coefs or inner_coefs[mode] - confusion_matrix = extract_cp_cm(boundaries, predictions) - - tps = confusion_matrix['tps'] - - score = np.inner([tps, len(confusion_matrix['FP']), len(confusion_matrix['FN'])], - coefs) - return score From c1ab5da891e7efc22d1fb68448c7329647e38269 Mon Sep 17 00:00:00 2001 From: Leon_Strelkov <103892559+leostre@users.noreply.github.com> Date: Thu, 25 Jul 2024 12:53:09 +0300 Subject: [PATCH 42/43] Apply suggestions from code review Co-authored-by: George Lopatenko <81328772+Lopa10ko@users.noreply.github.com> --- fedot_ind/core/models/quantile/quantile_extractor.py | 5 +---- fedot_ind/core/repository/model_repository.py | 4 ---- 2 files changed, 1 insertion(+), 8 deletions(-) diff --git a/fedot_ind/core/models/quantile/quantile_extractor.py b/fedot_ind/core/models/quantile/quantile_extractor.py index 596f165d6..17a44e0cd 100644 --- a/fedot_ind/core/models/quantile/quantile_extractor.py +++ b/fedot_ind/core/models/quantile/quantile_extractor.py @@ -42,10 +42,7 @@ def __init__(self, params: Optional[OperationParameters] = None): self.stride = params.get('stride', 1) self.add_global_features = params.get('add_global_features', True) self.logging_params.update({'Wsize': self.window_size, - 'Stride': self.stride, - # 'VarTh': self.var_threshold - } - ) + 'Stride': self.stride}) def _concatenate_global_and_local_feature( self, diff --git a/fedot_ind/core/repository/model_repository.py b/fedot_ind/core/repository/model_repository.py index b67df5d7c..c3e226dc7 100644 --- a/fedot_ind/core/repository/model_repository.py +++ b/fedot_ind/core/repository/model_repository.py @@ -37,10 +37,6 @@ from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor from xgboost import XGBRegressor -from fedot_ind.core.models.early_tc.ecec import ECEC -from fedot_ind.core.models.early_tc.economy_k import EconomyK -from fedot_ind.core.models.early_tc.prob_threshold import ProbabilityThresholdClassifier -from 
fedot_ind.core.models.early_tc.teaser import TEASER from fedot_ind.core.models.detection.anomaly.algorithms.arima_fault_detector import ARIMAFaultDetector from fedot_ind.core.models.detection.anomaly.algorithms.convolutional_autoencoder_detector import \ ConvolutionalAutoEncoderDetector From 916f89914691671b031c7f9492a9155908f70fba Mon Sep 17 00:00:00 2001 From: leostre Date: Fri, 26 Jul 2024 15:35:25 +0300 Subject: [PATCH 43/43] changed bump up fedot --- .github/workflows/poetry_unit_test.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/poetry_unit_test.yml b/.github/workflows/poetry_unit_test.yml index 2b3032116..b6b197b77 100644 --- a/.github/workflows/poetry_unit_test.yml +++ b/.github/workflows/poetry_unit_test.yml @@ -39,7 +39,7 @@ jobs: run: poetry install - name: Bump up FEDOT to a stable revision (temporary) - run: poetry add git+https://github.com/aimclub/FEDOT.git@e0b4ee7 + run: poetry add git+https://github.com/aimclub/FEDOT.git@master - name: Run tests with pytest run: poetry run pytest --cov=fedot_ind --cov-report xml:coverage.xml tests/unit