Mixture of Experts Model #108

Merged: 4 commits, merged Oct 13, 2023
Changes from 2 commits
18 changes: 18 additions & 0 deletions .github/workflows/python-package.yml
@@ -282,6 +282,24 @@ jobs:
run: pip install --upgrade --upgrade-strategy eager -e .
- name: Run tests
run: python -m tests.test_loading
test_moe:
timeout-minutes: 5
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v3
- name: Set up Python
uses: actions/setup-python@v4
with:
python-version: '3.7'
- name: Cache pip dependencies
uses: actions/cache@v2
with:
path: ~/.cache/pip
key: pip-cache
- name: Update
run: pip install --upgrade --upgrade-strategy eager -e .
- name: Run tests
run: python -m tests.test_moe
test_pneumatic_valve:
timeout-minutes: 5
runs-on: ubuntu-latest
1 change: 1 addition & 0 deletions src/progpy/__init__.py
@@ -5,6 +5,7 @@
from progpy.prognostics_model import PrognosticsModel
from progpy.ensemble_model import EnsembleModel
from progpy.composite_model import CompositeModel
from progpy.mixture_of_experts import MixtureOfExpertsModel
from progpy.linear_model import LinearModel
from progpy import predictors, state_estimators, uncertain_data

213 changes: 213 additions & 0 deletions src/progpy/mixture_of_experts.py
@@ -0,0 +1,213 @@
# Copyright © 2021 United States Government as represented by the Administrator of the
# National Aeronautics and Space Administration. All Rights Reserved.

import numpy as np

from progpy import PrognosticsModel, CompositeModel

DIVIDER = '.'


class MixtureOfExpertsModel(CompositeModel):
"""
.. versionadded:: 1.6.0

Mixture of Experts (MoE) models combine multiple models of the same system, similar to Ensemble models. Unlike Ensemble models, the aggregation is done by selecting the "best" model: the model that has performed best in the past.

The MoE model's inputs include the inputs and outputs of the individual models making up the model. If output values are provided as an input to the model, the model will update the scores during state transition. If not, state transition continues as normal. Typically, outputs are provided in the MoE model input when performing a state estimation step, but not when predicting forward.

Scores for the individual models are tracked in the state. At a state transition where outputs are provided, the score of the best-fitting model (i.e., lowest output error) will increase by max_score_step and the score of the worst-fitting model will decrease by max_score_step. All other models are scaled between these, based on their error.

When calling output, event_state, threshold_met, or performance_metrics, only the model with the best score will be called, and its results returned. In case of a tie, the first of the tied models (in the order provided to the constructor) will be used.

Args:
models (list[PrognosticsModel]): List of at least 2 models that form the mixture

Keyword Args:
process_noise : Optional, float or dict[str, float]
:term:`Process noise<process noise>` (applied at dx/next_state).
Can be number (e.g., .2) applied to every state, a dictionary of values for each
state (e.g., {'x1': 0.2, 'x2': 0.3}), or a function (x) -> x
process_noise_dist : Optional, str
distribution for :term:`process noise` (e.g., normal, uniform, triangular)
measurement_noise : Optional, float or dict[str, float]
:term:`Measurement noise<measurement noise>` (applied in output eqn).
Can be number (e.g., .2) applied to every output, a dictionary of values for each
output (e.g., {'z1': 0.2, 'z2': 0.3}), or a function (z) -> z
measurement_noise_dist : Optional, str
distribution for :term:`measurement noise` (e.g., normal, uniform, triangular)
max_score_step : Optional, float
The maximum step in the score. This is the value by which the score of the best model increases, and the worst model decreases.
"""

default_parameters = {
'max_score_step': 0.01
}

def __init__(self, models: list, **kwargs):
# Run initializer in CompositeModel
# Note: Input validation is done there
super().__init__(models, **kwargs)

# Re-Initialize (overriding CompositeModel) for all except state
# This is because state works like CompositeModel's, while the others work more like EnsembleModel's
self.inputs = set()
self.outputs = set()
self.events = set()
self.performance_metric_keys = set()

for (_, m) in self.parameters['models']:
self.inputs |= set(m.inputs)
self.outputs |= set(m.outputs)
self.events |= set(m.events)
self.performance_metric_keys |= set(m.performance_metric_keys)

self.inputs = list(self.inputs)
self.outputs = list(self.outputs)
self.states = list(self.states)
self.events = list(self.events)
self.performance_metric_keys = list(self.performance_metric_keys)

# Add outputs to inputs (last observed outputs are passed in as inputs to enable score updates)
self.inputs.extend(self.outputs)

# Add model scores
self.states.extend([model[0] + DIVIDER + "_score" for model in self.parameters['models']])

# Finish initialization with PrognosticsModel
# to reset StateContainer, etc.
# First reset noise (the double initialization doesn't work for that)
self.parameters = {key: value for key, value in self.parameters.items()} # Convert to dict
self.parameters['process_noise'] = kwargs.get('process_noise', 0)
self.parameters['measurement_noise'] = kwargs.get('measurement_noise', 0)
PrognosticsModel.__init__(self, **self.parameters)

def initialize(self, u=None, z=None):
if u is None:
u = {}
if z is None:
z = {}

# Initialize the models
x_0 = {}
for (name, m) in self.parameters['models']:
u_i = {key: u.get(name + DIVIDER + key, None) for key in m.inputs}
z_i = {key: z.get(name + DIVIDER + key, None) for key in m.outputs}
x_i = m.initialize(u_i, z_i)
for key, value in x_i.items():
x_0[name + DIVIDER + key] = value
x_0[name + DIVIDER + "_score"] = 0.5 # Initialize to half
return self.StateContainer(x_0)

def next_state(self, x, u, dt):

# Update state
for (name, m) in self.parameters['models']:
# Prepare inputs
u_i = {key: u.get(key, None) for key in m.inputs}
u_i = m.InputContainer(u_i)

# Prepare state
x_i = m.StateContainer({key: x[name + DIVIDER + key] for key in m.states})

# Propagate state
x_next_i = m.next_state(x_i, u_i, dt)

# Save to super state
for key, value in x_next_i.items():
x[name + DIVIDER + key] = value

# If outputs were provided - update the scores
if not np.any(np.isnan([u[key] for key in self.inputs])):
# No NaN values in u means we have an updated output, so update the scores
# Output values are set to NaN in u when there is no output update
mses = []
# Calculate MSE between observed and predicted outputs for each model
for name, m in self.parameters['models']:
gt = [u[z_key] for z_key in m.outputs]
x_i = m.StateContainer({key: x[name + DIVIDER + key] for key in m.states})
pred = [m.output(x_i)[z_key] for z_key in m.outputs]
mses.append(np.square(np.subtract(gt, pred)).mean())

min_mse = min(mses)
max_mse = max(mses)
diff_mse = max_mse-min_mse

# Score delta: +max_score_step for the best-fitting model, -max_score_step for the worst
# Guard against diff_mse == 0 (all models equally wrong), which would otherwise divide by zero
if diff_mse > 0:
score_delta = [(min_mse-mse)/diff_mse*(2*self.parameters['max_score_step'])+self.parameters['max_score_step'] for mse in mses]
else:
score_delta = [0] * len(mses)
for i, (key, _) in enumerate(self.parameters['models']):
score_key = key + DIVIDER + "_score"
x[score_key] += score_delta[i]

# Apply lower limit
x[score_key] = np.maximum(x[score_key], 0)
# Note: lower limit saturation is acceptable

# Apply upper limit
if x[score_key] > 1:
x[score_key] -= score_delta[i] # undo application
# Scale all scores by 0.8 (so they fall at or below 0.8)
# This is needed to prevent one outlier bad model
# from causing the other models to become saturated at 1
for j, (key_i, _) in enumerate(self.parameters['models']):
score_key_i = key_i + DIVIDER + "_score"
x[score_key_i] *= 0.8
score_delta[j] *= 0.8 # The pending score deltas also need to be scaled

x[score_key] += score_delta[i] # Redo application

return x

def output(self, x):
# Identify best model
best_value = -1
for i, (key, _) in enumerate(self.parameters['models']):
score_key = key + DIVIDER + "_score"
if x[score_key] > best_value:
best_value = x[score_key]
best_index = i

# Prepare state
name, m = self.parameters['models'][best_index]
x_i = m.StateContainer({key: x[name + DIVIDER + key] for key in m.states})
return m.output(x_i)

def event_state(self, x):
# Identify best model
best_value = -1
for i, (key, _) in enumerate(self.parameters['models']):
score_key = key + DIVIDER + "_score"
if x[score_key] > best_value:
best_value = x[score_key]
best_index = i

name, m = self.parameters['models'][best_index]
x_i = m.StateContainer({key: x[name + DIVIDER + key] for key in m.states})
return m.event_state(x_i)

def threshold_met(self, x):
# Identify best model
best_value = -1
for i, (key, _) in enumerate(self.parameters['models']):
score_key = key + DIVIDER + "_score"
if x[score_key] > best_value:
best_value = x[score_key]
best_index = i

name, m = self.parameters['models'][best_index]
x_i = m.StateContainer({key: x[name + DIVIDER + key] for key in m.states})
return m.threshold_met(x_i)

def performance_metrics(self, x):
# Identify best model
best_value = -1
for i, (key, _) in enumerate(self.parameters['models']):
score_key = key + DIVIDER + "_score"
if x[score_key] > best_value:
best_value = x[score_key]
best_index = i

name, m = self.parameters['models'][best_index]
x_i = m.StateContainer({key: x[name + DIVIDER + key] for key in m.states})
return m.performance_metrics(x_i)
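For context, here is a minimal usage sketch of the new model (not part of the diff). It assumes progpy's bundled ThrownObject model and the (name, model) tuple form accepted by CompositeModel; the names and parameter values are hypothetical. Note how the scoring works: with the default max_score_step of 0.01 and per-model MSEs of, say, [1, 3, 5], the score deltas work out to [+0.01, 0.0, -0.01].

from math import nan

from progpy import MixtureOfExpertsModel
from progpy.models import ThrownObject

# Two "experts": the same system with different parameter guesses (values hypothetical)
m_a = ThrownObject(g=-9.81)
m_b = ThrownObject(g=-9.75)
moe = MixtureOfExpertsModel([('a', m_a), ('b', m_b)])

x = moe.initialize()  # every model's score starts at 0.5

# Estimation step: include the observed output 'x' so the scores update
u_est = moe.InputContainer({'x': 38.5})
x = moe.next_state(x, u_est, 0.1)

# Prediction step: pass NaN for the output so the scores are left unchanged
u_pred = moe.InputContainer({'x': nan})
x = moe.next_state(x, u_pred, 0.1)

print(moe.output(x))  # delegates to the current best-scoring model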
42 changes: 42 additions & 0 deletions src/progpy/models/test_models/other_models.py
@@ -0,0 +1,42 @@
# Copyright © 2021 United States Government as represented by the Administrator of the National Aeronautics and Space Administration. All Rights Reserved.

from progpy import PrognosticsModel


class OneInputTwoOutputsOneEvent(PrognosticsModel):
"""
Simple example model where x0 increases at a rate of a * u0
"""
inputs = ['u0']
states = ['x0']
outputs = ['x0+b', 'x0+c']
events = ['x0==10']

default_parameters = {
'x0': { # Initial State
'x0': 0
},
'a': 1,
'b': 1,
'c': 1
}

def dx(self, x, u):
return self.StateContainer({
'x0': self.parameters['a'] * u['u0']
})

def output(self, x):
return self.OutputContainer({
'x0+b': x['x0'] + self.parameters['b'],
'x0+c': x['x0'] + self.parameters['c']
})

def event_state(self, x):
return {
'x0==10': 1-x['x0']/10
}

def threshold_met(self, x):
return {'x0==10': x['x0'] >= 10}
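A quick sketch of exercising this test model through progpy's standard simulation interface (the constant-loading function and keyword values are illustrative):

from progpy.models.test_models.other_models import OneInputTwoOutputsOneEvent

m = OneInputTwoOutputsOneEvent()

def future_loading(t, x=None):
    # Constant unit input: x0 grows at rate a * u0 = 1 per unit time
    return m.InputContainer({'u0': 1})

# The 'x0==10' event is reached when x0 hits 10, i.e., at about t = 10
results = m.simulate_to_threshold(future_loading, dt=0.1, save_freq=1)
print(results.times[-1])  # approximately 10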
5 changes: 3 additions & 2 deletions src/progpy/utils/parameters.py
@@ -150,8 +150,9 @@ def __setitem__(self, key: str, value: float, _copy: bool = False) -> None:

# Make sure every key is present
# (single value already handled above)
if not all([key in self['process_noise'] for key in self._m.states]):
raise ValueError("Process noise must have every key in model.states")
for key in self._m.states:
if key not in self['process_noise']:
self['process_noise'][key] = 0

elif key == 'measurement_noise' or key == 'measurement_noise_dist':
if callable(self['measurement_noise']):
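Side note on the behavior change above: a partially specified process-noise dictionary no longer raises a ValueError; unspecified states are now filled with zero. A hypothetical sketch:

from progpy.models import ThrownObject

m = ThrownObject()  # states: 'x' (position), 'v' (velocity)

# Previously this raised "Process noise must have every key in model.states";
# now the missing 'v' entry is silently filled with 0
m.parameters['process_noise'] = {'x': 0.2}
print(m.parameters['process_noise'])  # e.g., {'x': 0.2, 'v': 0}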
6 changes: 6 additions & 0 deletions tests/__main__.py
@@ -15,6 +15,7 @@
from tests.test_linear_model import main as linear_main
from tests.test_loading import main as loading_main
from tests.test_metrics import main as metrics_main
from tests.test_moe import main as moe_main
from tests.test_pneumatic_valve import main as pneumatic_valve_main
from tests.test_powertrain import main as powertrain_main
from tests.test_predictors import main as pred_main
@@ -104,6 +105,11 @@
except Exception:
was_successful = False

try:
moe_main()
except Exception:
was_successful = False

try:
pneumatic_valve_main()
except Exception: