Ensemble Rom #1720

Merged
30 commits, merged Jan 17, 2022

Commits
eab212f
add voting regressor
wangcj05 Nov 16, 2021
b439252
enable voting regressor
wangcj05 Nov 17, 2021
b501791
adjust RidgeCV to be allowed in voting regression
wangcj05 Nov 18, 2021
1ecd7f5
update ScikitLearnBase the way to initialize the model
wangcj05 Nov 18, 2021
cac2c5b
clean up sklearn rom, move multioutput wrapper to base class
wangcj05 Nov 18, 2021
082bbc7
fix couple of bugs, especially uniqueVals reset in trainLocal
wangcj05 Nov 19, 2021
7ff0d61
clean up
wangcj05 Nov 19, 2021
5e1ab5a
add gold file for VotingRegressor
wangcj05 Nov 19, 2021
9e58711
fix multiclass classifier
wangcj05 Nov 19, 2021
f2a172f
update voting regressor
wangcj05 Nov 20, 2021
922bd94
remove whitespace
wangcj05 Nov 20, 2021
3970942
fix settings
wangcj05 Nov 21, 2021
0752953
fix problem in voting regression, add tests to testing the voting reg…
wangcj05 Nov 23, 2021
26c2a3b
add voting regressor plot file
wangcj05 Nov 23, 2021
93db6df
update info
wangcj05 Nov 23, 2021
f360dcc
clean up
wangcj05 Nov 23, 2021
f7befda
initial implementation for Bagging Regressor
wangcj05 Nov 23, 2021
feb3926
remove the multioutput layer for inner estimator, which will allow th…
wangcj05 Nov 23, 2021
45937ec
add bagging regressor test
wangcj05 Nov 23, 2021
7934b08
move some checks to ScikitLearnBase
wangcj05 Nov 23, 2021
998e949
add AdaBoost Regressor
wangcj05 Nov 23, 2021
b41e067
update scikitlearn from version 0.21 to 0.22
wangcj05 Nov 24, 2021
903e650
delete whitespace
wangcj05 Nov 24, 2021
09fd2e0
add StackingRegressor
wangcj05 Nov 24, 2021
3a48993
add sklearn version check in StackingRegressor
wangcj05 Nov 24, 2021
bae6738
add user manual for Ensemble ROMs
wangcj05 Nov 24, 2021
b4d2061
address comments
wangcj05 Jan 17, 2022
8eabfa9
Merge branch 'devel' into wangc/ensemble_rom
wangcj05 Jan 17, 2022
01b2ada
update plots
wangcj05 Jan 17, 2022
7862f6a
update
wangcj05 Jan 17, 2022
3 changes: 2 additions & 1 deletion doc/user_manual/generated/generateRomDoc.py
@@ -753,7 +753,8 @@
'KerasMLPRegression',
'KerasConvNetClassifier',
'KerasLSTMClassifier',
'KerasLSTMRegression']
'KerasLSTMRegression'
]
validInternalRom = ['NDspline',
'pickledROM',
'GaussPolynomialRom',
398 changes: 327 additions & 71 deletions doc/user_manual/generated/sklRom.tex

Large diffs are not rendered by default.

1 change: 0 additions & 1 deletion framework/Models/PostProcessors/LimitSurface.py
@@ -131,7 +131,6 @@ def _initializeLSpp(self, runInfo, inputs, initDict):
self.ROM.initializeModel(settings)
else:
self.ROM = self.assemblerDict['ROM'][0][3]
self.ROM.reset()
Collaborator:

This change makes me pretty nervous. What else changed that supports removing this reset?

Collaborator Author:

I just do not see the value of the reset here. This is the initialization stage and the ROM is initialized during it, so why would we need to reset it?

Collaborator:

Hm, I don't disagree. I wonder why it was added in the first place.

self.indexes = -1
for index, inp in enumerate(self.inputs):
if mathUtils.isAString(inp) or isinstance(inp, bytes):
16 changes: 8 additions & 8 deletions framework/Models/ROM.py
@@ -112,8 +112,8 @@ def __init__(self):
self.printTag = 'ROM MODEL' # label
self.cvInstanceName = None # the name of Cross Validation instance
self.cvInstance = None # Instance of provided cross validation
self._estimatorName = None # the name of estimator instance
self._estimator = None # Instance of provided estimator (ROM)
self._estimatorNameList = [] # the name list of estimator instance
self._estimatorList = [] # List of instances of provided estimators (ROM)
self._interfaceROM = None # Instance of provided ROM

self.pickled = False # True if ROM comes from a pickled rom
@@ -133,7 +133,7 @@ def __init__(self):
self.addAssemblerObject('Classifier', InputData.Quantity.zero_to_one)
self.addAssemblerObject('Metric', InputData.Quantity.zero_to_infinity)
self.addAssemblerObject('CV', InputData.Quantity.zero_to_one)
self.addAssemblerObject('estimator', InputData.Quantity.zero_to_one)
self.addAssemblerObject('estimator', InputData.Quantity.zero_to_infinity)

def __getstate__(self):
"""
@@ -187,8 +187,8 @@ def _readMoreXML(self,xmlNode):
cvNode = paramInput.findFirst('CV')
if cvNode is not None:
self.cvInstanceName = cvNode.value
estimatorNode = paramInput.findFirst('estimator')
self._estimatorName = estimatorNode.value if estimatorNode is not None else None
estimatorNodeList = paramInput.findAll('estimator')
self._estimatorNameList = [estimatorNode.value for estimatorNode in estimatorNodeList] if len(estimatorNodeList) > 0 else []

self._interfaceROM = self.interfaceFactory.returnInstance(self.subType)
segmentNode = paramInput.findFirst('Segment')
@@ -235,9 +235,9 @@ def initialize(self,runInfo,inputs,initDict=None):
self.cvInstance.initialize(runInfo, inputs, initDict)

# only initialize once
if self._estimator is None and self._estimatorName is not None:
self._estimator = self.retrieveObjectFromAssemblerDict('estimator', self._estimatorName)
self._interfaceROM.setEstimator(self._estimator)
if len(self._estimatorList) == 0 and len(self._estimatorNameList) > 0:
self._estimatorList = [self.retrieveObjectFromAssemblerDict('estimator', estimatorName) for estimatorName in self._estimatorNameList]
self._interfaceROM.setEstimator(self._estimatorList)

def reset(self):
"""
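For context on the diff above: the ROM entity previously read at most one <estimator> node and stored a single instance; it now collects every <estimator> node and hands the whole list to the interface ROM. A minimal sketch of the new flow, assuming the same paramInput and retrieval helpers used in the diff (the standalone function names here are hypothetical):

# Sketch of the one-to-many estimator flow introduced above; helper names are hypothetical.
def readEstimatorNames(paramInput):
  # collect the names of all <estimator> nodes (zero or more)
  return [node.value for node in paramInput.findAll('estimator')]

def initializeEstimators(rom, estimatorNames, retrieve):
  # resolve each name exactly once, then pass the full list along
  if estimatorNames and not rom._estimatorList:
    rom._estimatorList = [retrieve('estimator', name) for name in estimatorNames]
    rom._interfaceROM.setEstimator(rom._estimatorList)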
6 changes: 6 additions & 0 deletions framework/SupervisedLearning/Factory.py
@@ -109,6 +109,12 @@
from .ScikitLearn.Tree.DecisionTreeRegressor import DecisionTreeRegressor
from .ScikitLearn.Tree.ExtraTreeClassifier import ExtraTreeClassifier
from .ScikitLearn.Tree.ExtraTreeRegressor import ExtraTreeRegressor
# Ensemble ROM for Regression
from .ScikitLearn.Ensemble.VotingRegressor import VotingRegressor
from .ScikitLearn.Ensemble.BaggingRegressor import BaggingRegressor
from .ScikitLearn.Ensemble.AdaBoostRegressor import AdaBoostRegressor
# require sklearn version 0.24 at least
from .ScikitLearn.Ensemble.StackingRegressor import StackingRegressor
################################################################################

factory = EntityFactory('SupervisedLearning')
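The comment above flags that StackingRegressor needs a newer scikit-learn (at least 0.24, per the comment) than the 0.22 floor adopted elsewhere in this PR. One way to keep the factory importable on older installs is a guarded import; a minimal sketch, assuming the 0.24 floor stated above:

# Sketch: register StackingRegressor only when scikit-learn is new enough.
import sklearn

def _versionTuple(versionString):
  # turn '0.24.2' into (0, 24, 2) for a simple tuple comparison
  return tuple(int(part) for part in versionString.split('.')[:3])

if _versionTuple(sklearn.__version__) >= (0, 24):
  from .ScikitLearn.Ensemble.StackingRegressor import StackingRegressor
else:
  StackingRegressor = None  # skipped; the input parser can then report a clear error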
@@ -46,9 +46,7 @@ def __init__(self):
super().__init__()
import sklearn
import sklearn.discriminant_analysis
import sklearn.multioutput
# we wrap the model with the multi output classifier (for multitarget)
self.model = sklearn.multioutput.MultiOutputClassifier(sklearn.discriminant_analysis.LinearDiscriminantAnalysis())
self.model = sklearn.discriminant_analysis.LinearDiscriminantAnalysis

@classmethod
def getInputSpecification(cls):
@@ -47,9 +47,7 @@ def __init__(self):
super().__init__()
import sklearn
import sklearn.discriminant_analysis
import sklearn.multioutput
# we wrap the model with the multi output classifier (for multitarget)
self.model = sklearn.multioutput.MultiOutputClassifier(sklearn.discriminant_analysis.QuadraticDiscriminantAnalysis())
self.model = sklearn.discriminant_analysis.QuadraticDiscriminantAnalysis

@classmethod
def getInputSpecification(cls):
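Both discriminant-analysis diffs above make the same change: __init__ now stores the bare sklearn class instead of a MultiOutputClassifier-wrapped instance, deferring instantiation (and any multioutput wrapping) to the base class. A minimal sketch of that deferred pattern, assuming a multioutputWrapper flag and an initializeModel(settings) hook like those used elsewhere in this PR:

# Sketch of the deferred-instantiation pattern; not the actual ScikitLearnBase code.
import sklearn.discriminant_analysis
import sklearn.multioutput

class SketchBase:
  def __init__(self):
    # store the class itself; settings are not known yet at construction time
    self.model = sklearn.discriminant_analysis.QuadraticDiscriminantAnalysis
    self.multioutputWrapper = True

  def initializeModel(self, settings):
    model = self.model(**settings)  # instantiate with the user's settings
    if self.multioutputWrapper:
      # wrap only now, so ensemble ROMs can still grab the bare estimator first
      model = sklearn.multioutput.MultiOutputClassifier(model)
    self.model = model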
121 changes: 121 additions & 0 deletions framework/SupervisedLearning/ScikitLearn/Ensemble/AdaBoostRegressor.py
@@ -0,0 +1,121 @@
# Copyright 2017 Battelle Energy Alliance, LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Created on Nov. 16, 2021

@author: wangc
AdaBoostRegressor
An AdaBoost regressor
"""
#Internal Modules (Lazy Importer)--------------------------------------------------------------------
#Internal Modules (Lazy Importer) End----------------------------------------------------------------

#External Modules------------------------------------------------------------------------------------
#External Modules End--------------------------------------------------------------------------------

#Internal Modules------------------------------------------------------------------------------------
from SupervisedLearning.ScikitLearn import ScikitLearnBase
from utils import InputData, InputTypes
#Internal Modules End--------------------------------------------------------------------------------

class AdaBoostRegressor(ScikitLearnBase):
"""
An AdaBoost regressor
"""
info = {'problemtype':'regression', 'normalize':False}

def __init__(self):
"""
Constructor that will appropriately initialize a supervised learning object
@ In, None
@ Out, None
"""
super().__init__()
self.multioutputWrapper = True
import sklearn
import sklearn.ensemble
self.model = sklearn.ensemble.AdaBoostRegressor

@classmethod
def getInputSpecification(cls):
"""
Method to get a reference to a class that specifies the input data for
class cls.
@ In, cls, the class for which we are retrieving the specification
@ Out, inputSpecification, InputData.ParameterInput, class to use for
specifying input of cls.
"""
specs = super().getInputSpecification()
specs.description = r"""The \xmlNode{AdaBoostRegressor} is a meta-estimator that begins by fitting a regressor on
the original dataset and then fits additional copies of the regressor on the same dataset
but where the weights of instances are adjusted according to the error of the current
prediction. As such, subsequent regressors focus more on difficult cases.
"""
estimatorInput = InputData.assemblyInputFactory("estimator", contentType=InputTypes.StringType,
descr=r"""name of a ROM that can be used as an estimator""", default='no-default')
specs.addSub(estimatorInput)
specs.addSub(InputData.parameterInputFactory("n_estimators", contentType=InputTypes.IntegerType,
descr=r"""The maximum number of estimators at which boosting is
terminated. In case of perfect fit, the learning procedure is
stopped early.""", default=50))
specs.addSub(InputData.parameterInputFactory("learning_rate", contentType=InputTypes.FloatType,
descr=r"""Weight applied to each regressor at each boosting iteration.
A higher learning rate increases the contribution of each regressor.
There is a trade-off between the learning\_rate and n\_estimators
parameters.""", default=1.0))
specs.addSub(InputData.parameterInputFactory("loss", contentType=InputTypes.makeEnumType("loss", "lossType",['linear', 'square', 'exponential']),
descr=r"""The loss function to use when updating the weights after each
boosting iteration.""", default='linear'))
specs.addSub(InputData.parameterInputFactory("random_state", contentType=InputTypes.IntegerType,
descr=r"""Controls the random seed given at each estimator at each
boosting iteration.""", default=None))
return specs

def _handleInput(self, paramInput):
"""
Function to handle the common parts of the distribution parameter input.
@ In, paramInput, ParameterInput, the already parsed input.
@ Out, None
"""
super()._handleInput(paramInput)
settings, notFound = paramInput.findNodesAndExtractValues(['n_estimators', 'learning_rate', 'loss', 'random_state'])
# notFound must be empty
assert(not notFound)
self.settings = settings

def setEstimator(self, estimatorList):
"""
Initialization method
@ In, estimatorList, list of ROM instances/estimators used by ROM
@ Out, None
"""
super().setEstimator(estimatorList)
if len(estimatorList) != 1:
self.raiseAWarning('ROM', self.name, 'can only accept one estimator, but multiple estimators are provided!',
'Only the first one will be used, i.e.,', estimatorList[0].name)
estimator = estimatorList[0]
interfaceRom = estimator._interfaceROM
if interfaceRom.info['problemtype'] != 'regression':
self.raiseAnError(IOError, 'estimator:', estimator.name, 'with problem type', interfaceRom.info['problemtype'],
'can not be used for', self.name)
# In sklearn, the multioutput wrapper can not be used by the outer and inner estimator at the same time.
# If the outer estimator can handle multioutput, the multioutput wrapper of the inner estimator can be kept;
# otherwise, we need to remove the wrapper from the inner estimator.
if interfaceRom.multioutputWrapper:
sklEstimator = interfaceRom.model.get_params()['estimator']
else:
sklEstimator = interfaceRom.model
settings = {'base_estimator':sklEstimator}
self.settings.update(settings)
self.initializeModel(self.settings)
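To illustrate the unwrapping comment in setEstimator above with plain scikit-learn: a MultiOutputRegressor exposes its inner estimator through get_params()['estimator'], and that bare estimator is what base_estimator expects (argument name per the 0.22-era scikit-learn this PR targets). A standalone sketch, not RAVEN code:

# Standalone sketch of the wrapper-unwrapping logic used by setEstimator above.
import numpy as np
from sklearn.ensemble import AdaBoostRegressor
from sklearn.multioutput import MultiOutputRegressor
from sklearn.tree import DecisionTreeRegressor

wrapped = MultiOutputRegressor(DecisionTreeRegressor(max_depth=3))
inner = wrapped.get_params()['estimator']  # the bare DecisionTreeRegressor

# the inner estimator feeds the booster; multioutput handling is re-applied
# around the outer AdaBoostRegressor instead of the inner estimator
booster = MultiOutputRegressor(AdaBoostRegressor(base_estimator=inner, n_estimators=50))

X = np.random.rand(100, 2)
Y = np.column_stack([X.sum(axis=1), X.prod(axis=1)])  # two targets
booster.fit(X, Y)
print(booster.predict(X[:3]))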
139 changes: 139 additions & 0 deletions framework/SupervisedLearning/ScikitLearn/Ensemble/BaggingRegressor.py
@@ -0,0 +1,139 @@
# Copyright 2017 Battelle Energy Alliance, LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Created on Nov. 22, 2021

@author: wangc
BaggingRegressor
A Bagging regressor.
"""
#Internal Modules (Lazy Importer)--------------------------------------------------------------------
#Internal Modules (Lazy Importer) End----------------------------------------------------------------

#External Modules------------------------------------------------------------------------------------
#External Modules End--------------------------------------------------------------------------------

#Internal Modules------------------------------------------------------------------------------------
from SupervisedLearning.ScikitLearn import ScikitLearnBase
from utils import InputData, InputTypes
#Internal Modules End--------------------------------------------------------------------------------

class BaggingRegressor(ScikitLearnBase):
"""
A Bagging Regressor
A Bagging regressor is an ensemble meta-estimator that fits base regressors each on random subsets of the original
dataset and then aggregates their individual predictions (either by voting or by averaging) to form a final
prediction. Such a meta-estimator can typically be used as a way to reduce the variance of a black-box estimator
(e.g., a decision tree), by introducing randomization into its construction procedure and then making an ensemble
out of it.

This algorithm encompasses several works from the literature. When random subsets of the dataset are drawn as
random subsets of the samples, then this algorithm is known as Pasting. If samples are drawn with replacement,
then the method is known as Bagging. When random subsets of the dataset are drawn as random subsets of the
features, then the method is known as Random Subspaces. Finally, when base estimators are built on subsets of
both samples and features, then the method is known as Random Patches.
"""
info = {'problemtype':'regression', 'normalize':False}

def __init__(self):
"""
Constructor that will appropriately initialize a supervised learning object
@ In, None
@ Out, None
"""
super().__init__()
self.multioutputWrapper = True
import sklearn
import sklearn.ensemble
self.model = sklearn.ensemble.BaggingRegressor

@classmethod
def getInputSpecification(cls):
"""
Method to get a reference to a class that specifies the input data for
class cls.
@ In, cls, the class for which we are retrieving the specification
@ Out, inputSpecification, InputData.ParameterInput, class to use for
specifying input of cls.
"""
specs = super().getInputSpecification()
specs.description = r"""The \xmlNode{BaggingRegressor} is an ensemble meta-estimator that fits base regressors each on random subsets of the original
dataset and then aggregates their individual predictions (either by voting or by averaging) to form a final
prediction. Such a meta-estimator can typically be used as a way to reduce the variance of a black-box estimator
(e.g., a decision tree), by introducing randomization into its construction procedure and then making an ensemble
out of it.
"""
estimatorInput = InputData.assemblyInputFactory("estimator", contentType=InputTypes.StringType,
descr=r"""name of a ROM that can be used as an estimator""", default='no-default')
specs.addSub(estimatorInput)
specs.addSub(InputData.parameterInputFactory("n_estimators", contentType=InputTypes.IntegerType,
descr=r"""The number of base estimators in the ensemble.""", default=10))
specs.addSub(InputData.parameterInputFactory("max_samples", contentType=InputTypes.FloatType,
descr=r"""The number of samples to draw from X to train each base estimator""", default=1.0))
specs.addSub(InputData.parameterInputFactory("max_features", contentType=InputTypes.FloatType,
descr=r"""The number of features to draw from X to train each base estimator """, default=1.0))
specs.addSub(InputData.parameterInputFactory("bootstrap", contentType=InputTypes.BoolType,
descr=r"""Whether samples are drawn with replacement. If False, sampling without
replacement is performed.""", default=True))
specs.addSub(InputData.parameterInputFactory("bootstrap_features", contentType=InputTypes.BoolType,
descr=r"""Whether features are drawn with replacement.""", default=False))
specs.addSub(InputData.parameterInputFactory("oob_score", contentType=InputTypes.BoolType,
descr=r"""Whether to use out-of-bag samples to estimate the generalization error.
Only available if bootstrap=True.""", default=False))
specs.addSub(InputData.parameterInputFactory("warm_start", contentType=InputTypes.BoolType,
descr=r"""When set to True, reuse the solution of the previous call to fit and add more
estimators to the ensemble, otherwise, just fit a whole new ensemble.""", default=False))
specs.addSub(InputData.parameterInputFactory("random_state", contentType=InputTypes.IntegerType,
descr=r"""Controls the random resampling of the original dataset (sample wise and feature wise). """,
default=None))
return specs

def _handleInput(self, paramInput):
"""
Function to handle the common parts of the distribution parameter input.
@ In, paramInput, ParameterInput, the already parsed input.
@ Out, None
"""
super()._handleInput(paramInput)
settings, notFound = paramInput.findNodesAndExtractValues(['n_estimators', 'max_samples', 'max_features', 'bootstrap', 'bootstrap_features',
'oob_score', 'warm_start', 'random_state'])
# notFound must be empty
assert(not notFound)
self.settings = settings

def setEstimator(self, estimatorList):
"""
Initialization method
@ In, estimatorList, list of ROM instances/estimators used by ROM
@ Out, None
"""
super().setEstimator(estimatorList)
if len(estimatorList) != 1:
self.raiseAWarning('ROM', self.name, 'can only accept one estimator, but multiple estimators are provided!',
'Only the first one will be used, i.e.,', estimatorList[0].name)
estimator = estimatorList[0]
interfaceRom = estimator._interfaceROM
if interfaceRom.info['problemtype'] != 'regression':
self.raiseAnError(IOError, 'estimator:', estimator.name, 'with problem type', interfaceRom.info['problemtype'],
'can not be used for', self.name)
# In sklearn, the multioutput wrapper can not be used by the outer and inner estimator at the same time.
# If the outer estimator can handle multioutput, the multioutput wrapper of the inner estimator can be kept;
# otherwise, we need to remove the wrapper from the inner estimator.
if interfaceRom.multioutputWrapper:
sklEstimator = interfaceRom.model.get_params()['estimator']
else:
sklEstimator = interfaceRom.model
settings = {'base_estimator':sklEstimator}
self.settings.update(settings)
self.initializeModel(self.settings)
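The docstring above names four sampling regimes (Pasting, Bagging, Random Subspaces, Random Patches); they map directly onto the max_samples, max_features, and bootstrap parameters exposed here. A plain scikit-learn sketch (0.22-era base_estimator argument):

# Sketch: the four ensemble variants from the docstring, as BaggingRegressor settings.
from sklearn.ensemble import BaggingRegressor
from sklearn.tree import DecisionTreeRegressor

tree = DecisionTreeRegressor()
pasting   = BaggingRegressor(base_estimator=tree, max_samples=0.5, bootstrap=False)   # sample subsets, no replacement
bagging   = BaggingRegressor(base_estimator=tree, max_samples=0.5, bootstrap=True)    # samples drawn with replacement
subspaces = BaggingRegressor(base_estimator=tree, max_features=0.5, bootstrap=False)  # feature subsets
patches   = BaggingRegressor(base_estimator=tree, max_samples=0.5, max_features=0.5)  # subsets of both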