From 9b7d07d72c90c854908b90db89368c9c79793e4c Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Tue, 16 Jul 2024 15:56:46 +0200 Subject: [PATCH 01/25] Update readme. --- README.md | 39 +++++++++++---------------------------- 1 file changed, 11 insertions(+), 28 deletions(-) diff --git a/README.md b/README.md index 874e520df..033571ddb 100644 --- a/README.md +++ b/README.md @@ -12,39 +12,22 @@ [![image](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black) [![image](https://img.shields.io/badge/Contributor%20Covenant-2.1-4baaaa.svg)](CODE_OF_CONDUCT.md) [![image](https://pepy.tech/badge/estimagic/month)](https://pepy.tech/project/estimagic) +[![image](https://img.shields.io/badge/NumFOCUS-affiliated%20project-orange.svg?style=flat&colorA=E1523D&colorB=007D8A)](https://numfocus.org/sponsored-projects/affiliated-projects) +[![image](https://img.shields.io/twitter/follow/aiidateam.svg?style=social&label=Follow)](https://x.com/optimagic) ## Introduction -optimagic is a Python package for nonlinear optimization with or without constraints. It -is particularly suited to solve difficult nonlinear estimation problems. On top, it -provides functionality to perform statistical inference on estimated parameters. +*optimagic* is a Python package for numerical optimization. It is a unified interface to +optimizers from SciPy, NlOpt and many other Python packages. -### Optimization +*optimagic*'s `minimize` function works just like SciPy's, so you don't have to adjust +your code. You simply get more optimizers for free. On top you get powerful diagnostic +tools, parallel numerical derivatives and more. If you want to see what *optimagic* can +do, check out this [tutorial](tutorials/optimization_overview.ipynb) -- optimagic wraps algorithms from *scipy.optimize*, *nlopt*, *pygmo* and more. -- optimagic implements constraints efficiently via reparametrization, so you can solve - constrained problems with any optimizer that supports bounds. 
-- The parameters of an optimization problem can be arbitrary pytrees -- The complete history of parameters and function evaluations can be saved in a database - for maximum reproducibility. -- Painless and efficient multistart optimization. -- The progress of the optimization can be displayed in `criterion_plot` and - `params_plot` while the optimization is still running. - -### Estimation and Inference - -- You can estimate a model using method of simulated moments (MSM), calculate standard - errors and do sensitivity analysis with just one function call. -- Asymptotic standard errors for maximum likelihood estimation. -- estimagic also provides bootstrap confidence intervals and standard errors. Of course - the bootstrap procedures are parallelized. - -### Numerical differentiation - -- optimagic can calculate precise numerical derivatives using - [Richardson extrapolations](https://en.wikipedia.org/wiki/Richardson_extrapolation). -- Function evaluations needed for numerical derivatives can be done in parallel with - pre-implemented or user provided batch evaluators. +*optimagic* was formerly called *estimagic*, because it also provides functionality to +perform statistical inference on estimated parameters. *estimagic* is now a subpackage +of *optimagic*. ## Installation From 44a9e74ce90736d9d73680dc1ae41de2ce86b773 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 08:23:48 +0200 Subject: [PATCH 02/25] Fix? 
--- .github/workflows/main.yml | 4 ++-- README.md | 3 +-- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 592b7753d..2375428f3 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -120,9 +120,9 @@ jobs: strategy: fail-fast: false steps: - - uses: actions/checkout@v3 + - uses: actions/checkout@v4 - name: create build environment - uses: mamba-org/provision-with-micromamba@main + uses: mamba-org/setup-micromamba@v1 with: environment-file: ./.envs/testenv-linux.yml environment-name: optimagic diff --git a/README.md b/README.md index 033571ddb..8cffadd5d 100644 --- a/README.md +++ b/README.md @@ -22,8 +22,7 @@ optimizers from SciPy, NlOpt and many other Python packages. *optimagic*'s `minimize` function works just like SciPy's, so you don't have to adjust your code. You simply get more optimizers for free. On top you get powerful diagnostic -tools, parallel numerical derivatives and more. If you want to see what *optimagic* can -do, check out this [tutorial](tutorials/optimization_overview.ipynb) +tools, parallel numerical derivatives and more. *optimagic* was formerly called *estimagic*, because it also provides functionality to perform statistical inference on estimated parameters. *estimagic* is now a subpackage From 6a21d6effbf9eac4c2c869317c331bdc57c13057 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 12:35:31 +0200 Subject: [PATCH 03/25] Add logos to readme. --- README.md | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/README.md b/README.md index 8cffadd5d..af35ebef2 100644 --- a/README.md +++ b/README.md @@ -83,3 +83,14 @@ If you use optimagic for your research, please do not forget to cite it. 
Url = {https://github.com/OpenSourceEconomics/optimagic} } ``` + +## Acknowledgements + +We thank all institutions that have funded or supported optimagic (formerly estimagic) + + + + + + + From c43df7de697b69a3582376919daeabdc138e88cb Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 13:25:14 +0200 Subject: [PATCH 04/25] Basic renaming and deprecations. --- src/estimagic/estimate_ml.py | 4 +- src/optimagic/exceptions.py | 4 + src/optimagic/optimization/optimize.py | 581 +++++++----------- tests/optimagic/logging/test_read_log.py | 2 +- .../optimization/test_criterion_versions.py | 4 +- .../optimization/test_derivative_versions.py | 28 +- .../optimization/test_history_collection.py | 4 +- .../optimization/test_jax_derivatives.py | 20 +- .../optimization/test_many_algorithms.py | 6 +- .../optimagic/optimization/test_multistart.py | 24 +- .../test_optimizations_with_scaling.py | 4 +- tests/optimagic/optimization/test_optimize.py | 6 +- .../optimization/test_params_versions.py | 12 +- .../optimization/test_useful_exceptions.py | 12 +- .../test_with_advanced_constraints.py | 4 +- .../optimization/test_with_constraints.py | 18 +- .../test_with_nonlinear_constraints.py | 2 +- .../visualization/test_history_plots.py | 6 +- tests/test_deprecations.py | 2 +- 19 files changed, 300 insertions(+), 443 deletions(-) diff --git a/src/estimagic/estimate_ml.py b/src/estimagic/estimate_ml.py index 714ca76b0..a6b326ac9 100644 --- a/src/estimagic/estimate_ml.py +++ b/src/estimagic/estimate_ml.py @@ -166,8 +166,8 @@ def estimate_ml( opt_res = None else: opt_res = maximize( - criterion=loglike, - criterion_kwargs=loglike_kwargs, + fun=loglike, + fun_kwargs=loglike_kwargs, params=params, lower_bounds=lower_bounds, upper_bounds=upper_bounds, diff --git a/src/optimagic/exceptions.py b/src/optimagic/exceptions.py index 180b130ea..559a14532 100644 --- a/src/optimagic/exceptions.py +++ b/src/optimagic/exceptions.py @@ -23,6 +23,10 @@ class 
UserFunctionRuntimeError(OptimagicError): """Exception that is raised when user provided functions raise errors.""" +class MissingInputError(OptimagicError): + """Exception for missing user provided input.""" + + class InvalidKwargsError(OptimagicError): """Exception for invalid user provided keyword arguments.""" diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index a7bd9c5ca..1dcf8de81 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -3,7 +3,11 @@ from pathlib import Path from optimagic.batch_evaluators import process_batch_evaluator -from optimagic.exceptions import InvalidFunctionError, InvalidKwargsError +from optimagic.exceptions import ( + InvalidFunctionError, + InvalidKwargsError, + MissingInputError, +) from optimagic.logging.create_tables import ( make_optimization_iteration_table, make_optimization_problem_table, @@ -33,21 +37,21 @@ def maximize( - criterion, - params, - algorithm, + fun=None, + params=None, + algorithm=None, *, lower_bounds=None, upper_bounds=None, soft_lower_bounds=None, soft_upper_bounds=None, - criterion_kwargs=None, + fun_kwargs=None, constraints=None, algo_options=None, - derivative=None, - derivative_kwargs=None, - criterion_and_derivative=None, - criterion_and_derivative_kwargs=None, + jac=None, + jac_kwargs=None, + fun_and_jac=None, + fun_and_jac_kwargs=None, numdiff_options=None, logging=False, log_options=None, @@ -59,166 +63,31 @@ def maximize( multistart_options=None, collect_history=True, skip_checks=False, + # deprecated arguments + criterion=None, + criterion_kwargs=None, + derivative=None, + derivative_kwargs=None, + criterion_and_derivative=None, + criterion_and_derivative_kwargs=None, ): - """Maximize criterion using algorithm subject to constraints. 
- - Args: - criterion (callable): A function that takes a params as first argument and - returns a scalar (if only scalar algorithms will be used) or a dictionary - that contains at the entries "value" (a scalar float), "contributions" (a - pytree containing the summands that make up the criterion value) or - "root_contributions" (a pytree containing the residuals of a least-squares - problem) and any number of additional entries. The additional dict entries - will be stored in a database if logging is used. - params (pandas): A pytree containing the parameters with respect to which the - criterion is optimized. Examples are a numpy array, a pandas Series, - a DataFrame with "value" column, a float and any kind of (nested) dictionary - or list containing these elements. See :ref:`params` for examples. - algorithm (str or callable): Specifies the optimization algorithm. For built-in - algorithms this is a string with the name of the algorithm. Otherwise it can - be a callable with the optimagic algorithm interface. See :ref:`algorithms`. - lower_bounds (pytree): A pytree with the same structure as params with lower - bounds for the parameters. Can be ``-np.inf`` for parameters with no lower - bound. - upper_bounds (pytree): As lower_bounds. Can be ``np.inf`` for parameters with - no upper bound. - soft_lower_bounds (pytree): As lower bounds but the bounds are not imposed - during optimization and just used to sample start values if multistart - optimization is performed. - soft_upper_bounds (pytree): As soft_lower_bounds. - criterion_kwargs (dict): Additional keyword arguments for criterion - constraints (list, dict): List with constraint dictionaries or single dict. - See :ref:`constraints`. - algo_options (dict): Algorithm specific configuration of the optimization. See - :ref:`list_of_algorithms` for supported options of each algorithm. - derivative (callable): Function that calculates the first derivative - of criterion. 
For most algorithm, this is the gradient of the scalar - output (or "value" entry of the dict). However some algorithms (e.g. bhhh) - require the jacobian of the "contributions" entry of the dict. You will get - an error if you provide the wrong type of derivative. - derivative_kwargs (dict): Additional keyword arguments for derivative. - criterion_and_derivative (callable): Function that returns criterion - and derivative as a tuple. This can be used to exploit synergies in the - evaluation of both functions. The first element of the tuple has to be - exactly the same as the output of criterion. The second has to be exactly - the same as the output of derivative. - criterion_and_derivative_kwargs (dict): Additional keyword arguments for - criterion and derivative. - numdiff_options (dict): Keyword arguments for the calculation of numerical - derivatives. See :ref:`first_derivative` for details. Note that the default - method is changed to "forward" for speed reasons. - logging (pathlib.Path, str or False): Path to sqlite3 file (which typically has - the file extension ``.db``. If the file does not exist, it will be created. - When doing parallel optimizations and logging is provided, you have to - provide a different path for each optimization you are running. You can - disable logging completely by setting it to False, but we highly recommend - not to do so. - log_options (dict): Additional keyword arguments to configure the logging. - - "fast_logging": A boolean that determines if "unsafe" settings are used - to speed up write processes to the database. This should only be used for - very short running criterion functions where the main purpose of the log - is monitoring and it would not be catastrophic to get a - corrupted database in case of a sudden system shutdown. If one evaluation - of the criterion function (and gradient if applicable) takes more than - 100 ms, the logging overhead is negligible. 
- - "if_table_exists": (str) One of "extend", "replace", "raise". What to - do if the tables we want to write to already exist. Default "extend". - - "if_database_exists": (str): One of "extend", "replace", "raise". What to - do if the database we want to write to already exists. Default "extend". - error_handling (str): Either "raise" or "continue". Note that "continue" does - not absolutely guarantee that no error is raised but we try to handle as - many errors as possible in that case without aborting the optimization. - error_penalty (dict): Dict with the entries "constant" (float) and "slope" - (float). If the criterion or gradient raise an error and error_handling is - "continue", return ``constant + slope * norm(params - start_params)`` where - ``norm`` is the euclidean distance as criterion value and adjust the - derivative accordingly. This is meant to guide the optimizer back into a - valid region of parameter space (in direction of the start parameters). - Note that the constant has to be high enough to ensure that the penalty is - actually a bad function value. The default constant is f0 + abs(f0) + 100 - for minimizations and f0 - abs(f0) - 100 for maximizations, where - f0 is the criterion value at start parameters. The default slope is 0.1. - scaling (bool): If True, the parameter vector is rescaled internally for - better performance with scale sensitive optimizers. - scaling_options (dict or None): Options to configure the internal scaling ot - the parameter vector. See :ref:`scaling` for details and recommendations. - multistart (bool): Whether to do the optimization from multiple starting points. - Requires the params to have the columns ``"soft_lower_bound"`` and - ``"soft_upper_bounds"`` with finite values for all parameters, unless - the standard bounds are already finite for all parameters. - multistart_options (dict): Options to configure the optimization from multiple - starting values. 
The dictionary has the following entries - (all of which are optional): - - n_samples (int): Number of sampled points on which to do one function - evaluation. Default is 10 * n_params. - - sample (pandas.DataFrame or numpy.ndarray) A user definde sample. - If this is provided, n_samples, sampling_method and sampling_distribution - are not used. - - share_optimizations (float): Share of sampled points that is used to - construct a starting point for a local optimization. Default 0.1. - - sampling_distribution (str): One rof "uniform", "triangle". Default is - "uniform" as in the original tiktak algorithm. - - sampling_method (str): One of "random", "sobol", "halton", "hammersley", - "korobov", "latin_hypercube" or a numpy array or DataFrame with custom - points. Default is sobol for problems with up to 30 parameters and random - for problems with more than 30 parameters. - - mixing_weight_method (str or callable): Specifies how much weight is put - on the currently best point when calculating a new starting point for a - local optimization out of the currently best point and the next random - starting point. Either "tiktak" or "linear" or a callable that takes the - arguments ``iteration``, ``n_iterations``, ``min_weight``, ``max_weight``. - Default "tiktak". - - mixing_weight_bounds (tuple): A tuple consisting of a lower and upper - bound on mixing weights. Default (0.1, 0.995). - - convergence_max_discoveries (int): The multistart optimization converges - if the currently best local optimum has been discovered independently in - ``convergence_max_discoveries`` many local optimizations. Default 2. - - convergence.relative_params_tolerance (float): Determines the maximum - relative distance two parameter vectors can have to be considered equal - for convergence purposes. - - n_cores (int): Number cores used to evaluate the criterion function in - parallel during exploration stages and number of parallel local - optimization in optimization stages. Default 1. 
- - batch_evaluator (str or callable): See :ref:`batch_evaluators` for - details. Default "joblib". - - batch_size (int): If n_cores is larger than one, several starting points - for local optimizations are created with the same weight and from the same - currently best point. The ``batch_size`` argument is a way to reproduce - this behavior on a small machine where less cores are available. By - default the batch_size is equal to ``n_cores``. It can never be smaller - than ``n_cores``. - - seed (int): Random seed for the creation of starting values. Default None. - - exploration_error_handling (str): One of "raise" or "continue". Default - is continue, which means that failed function evaluations are simply - discarded from the sample. - - optimization_error_handling (str): One of "raise" or "continue". Default - is continue, which means that failed optimizations are simply discarded. - collect_history (bool): Whether the history of parameters and criterion values - should be collected and returned as part of the result. Default True. - skip_checks (bool): Whether checks on the inputs are skipped. This makes the - optimization faster, especially for very fast criterion functions. Default - False. - - Returns: - OptimizeResult: The optmization result. 
- - """ + """Maximize criterion using algorithm subject to constraints.""" return _optimize( direction="maximize", - criterion=criterion, + fun=fun, params=params, algorithm=algorithm, lower_bounds=lower_bounds, upper_bounds=upper_bounds, soft_lower_bounds=soft_lower_bounds, soft_upper_bounds=soft_upper_bounds, - criterion_kwargs=criterion_kwargs, + fun_kwargs=fun_kwargs, constraints=constraints, algo_options=algo_options, - derivative=derivative, - derivative_kwargs=derivative_kwargs, - criterion_and_derivative=criterion_and_derivative, - criterion_and_derivative_kwargs=criterion_and_derivative_kwargs, + jac=jac, + jac_kwargs=jac_kwargs, + fun_and_jac=fun_and_jac, + fun_and_jac_kwargs=fun_and_jac_kwargs, numdiff_options=numdiff_options, logging=logging, log_options=log_options, @@ -230,25 +99,32 @@ def maximize( multistart_options=multistart_options, collect_history=collect_history, skip_checks=skip_checks, + # deprecated arguments + criterion=criterion, + criterion_kwargs=criterion_kwargs, + derivative=derivative, + derivative_kwargs=derivative_kwargs, + criterion_and_derivative=criterion_and_derivative, + criterion_and_derivative_kwargs=criterion_and_derivative_kwargs, ) def minimize( - criterion, - params, - algorithm, + fun=None, + params=None, + algorithm=None, *, lower_bounds=None, upper_bounds=None, soft_lower_bounds=None, soft_upper_bounds=None, - criterion_kwargs=None, + fun_kwargs=None, constraints=None, algo_options=None, - derivative=None, - derivative_kwargs=None, - criterion_and_derivative=None, - criterion_and_derivative_kwargs=None, + jac=None, + jac_kwargs=None, + fun_and_jac=None, + fun_and_jac_kwargs=None, numdiff_options=None, logging=False, log_options=None, @@ -260,166 +136,32 @@ def minimize( multistart_options=None, collect_history=True, skip_checks=False, + # deprecated arguments + criterion=None, + criterion_kwargs=None, + derivative=None, + derivative_kwargs=None, + criterion_and_derivative=None, + criterion_and_derivative_kwargs=None, 
): - """Minimize criterion using algorithm subject to constraints. - - Args: - criterion (callable): A function that takes a params as first argument and - returns a scalar (if only scalar algorithms will be used) or a dictionary - that contains at the entries "value" (a scalar float), "contributions" (a - pytree containing the summands that make up the criterion value) or - "root_contributions" (a pytree containing the residuals of a least-squares - problem) and any number of additional entries. The additional dict entries - will be stored in a database if logging is used. - params (pandas): A pytree containing the parameters with respect to which the - criterion is optimized. Examples are a numpy array, a pandas Series, - a DataFrame with "value" column, a float and any kind of (nested) dictionary - or list containing these elements. See :ref:`params` for examples. - algorithm (str or callable): Specifies the optimization algorithm. For built-in - algorithms this is a string with the name of the algorithm. Otherwise it can - be a callable with the optimagic algorithm interface. See :ref:`algorithms`. - lower_bounds (pytree): A pytree with the same structure as params with lower - bounds for the parameters. Can be ``-np.inf`` for parameters with no lower - bound. - upper_bounds (pytree): As lower_bounds. Can be ``np.inf`` for parameters with - no upper bound. - soft_lower_bounds (pytree): As lower bounds but the bounds are not imposed - during optimization and just used to sample start values if multistart - optimization is performed. - soft_upper_bounds (pytree): As soft_lower_bounds. - criterion_kwargs (dict): Additional keyword arguments for criterion - constraints (list, dict): List with constraint dictionaries or single dict. - See :ref:`constraints`. - algo_options (dict): Algorithm specific configuration of the optimization. See - :ref:`list_of_algorithms` for supported options of each algorithm. 
- derivative (callable): Function that calculates the first derivative - of criterion. For most algorithm, this is the gradient of the scalar - output (or "value" entry of the dict). However some algorithms (e.g. bhhh) - require the jacobian of the "contributions" entry of the dict. You will get - an error if you provide the wrong type of derivative. - derivative_kwargs (dict): Additional keyword arguments for derivative. - criterion_and_derivative (callable): Function that returns criterion - and derivative as a tuple. This can be used to exploit synergies in the - evaluation of both functions. The first element of the tuple has to be - exactly the same as the output of criterion. The second has to be exactly - the same as the output of derivative. - criterion_and_derivative_kwargs (dict): Additional keyword arguments for - criterion and derivative. - numdiff_options (dict): Keyword arguments for the calculation of numerical - derivatives. See :ref:`first_derivative` for details. Note that the default - method is changed to "forward" for speed reasons. - logging (pathlib.Path, str or False): Path to sqlite3 file (which typically has - the file extension ``.db``. If the file does not exist, it will be created. - When doing parallel optimizations and logging is provided, you have to - provide a different path for each optimization you are running. You can - disable logging completely by setting it to False, but we highly recommend - not to do so. - log_options (dict): Additional keyword arguments to configure the logging. - - "fast_logging": A boolean that determines if "unsafe" settings are used - to speed up write processes to the database. This should only be used for - very short running criterion functions where the main purpose of the log - is monitoring and it would not be catastrophic to get a - corrupted database in case of a sudden system shutdown. 
If one evaluation - of the criterion function (and gradient if applicable) takes more than - 100 ms, the logging overhead is negligible. - - "if_table_exists": (str) One of "extend", "replace", "raise". What to - do if the tables we want to write to already exist. Default "extend". - - "if_database_exists": (str): One of "extend", "replace", "raise". What to - do if the database we want to write to already exists. Default "extend". - error_handling (str): Either "raise" or "continue". Note that "continue" does - not absolutely guarantee that no error is raised but we try to handle as - many errors as possible in that case without aborting the optimization. - error_penalty (dict): Dict with the entries "constant" (float) and "slope" - (float). If the criterion or gradient raise an error and error_handling is - "continue", return ``constant + slope * norm(params - start_params)`` where - ``norm`` is the euclidean distance as criterion value and adjust the - derivative accordingly. This is meant to guide the optimizer back into a - valid region of parameter space (in direction of the start parameters). - Note that the constant has to be high enough to ensure that the penalty is - actually a bad function value. The default constant is f0 + abs(f0) + 100 - for minimizations and f0 - abs(f0) - 100 for maximizations, where - f0 is the criterion value at start parameters. The default slope is 0.1. - scaling (bool): If True, the parameter vector is rescaled internally for - better performance with scale sensitive optimizers. - scaling_options (dict or None): Options to configure the internal scaling ot - the parameter vector. See :ref:`scaling` for details and recommendations. - multistart (bool): Whether to do the optimization from multiple starting points. - Requires the params to have the columns ``"soft_lower_bound"`` and - ``"soft_upper_bounds"`` with finite values for all parameters, unless - the standard bounds are already finite for all parameters. 
- multistart_options (dict): Options to configure the optimization from multiple - starting values. The dictionary has the following entries - (all of which are optional): - - n_samples (int): Number of sampled points on which to do one function - evaluation. Default is 10 * n_params. - - sample (pandas.DataFrame or numpy.ndarray) A user definde sample. - If this is provided, n_samples, sampling_method and sampling_distribution - are not used. - - share_optimizations (float): Share of sampled points that is used to - construct a starting point for a local optimization. Default 0.1. - - sampling_distribution (str): One rof "uniform", "triangle". Default is - "uniform" as in the original tiktak algorithm. - - sampling_method (str): One of "random", "sobol", "halton", "hammersley", - "korobov", "latin_hypercube" or a numpy array or DataFrame with custom - points. Default is sobol for problems with up to 30 parameters and random - for problems with more than 30 parameters. - - mixing_weight_method (str or callable): Specifies how much weight is put - on the currently best point when calculating a new starting point for a - local optimization out of the currently best point and the next random - starting point. Either "tiktak" or "linear" or a callable that takes the - arguments ``iteration``, ``n_iterations``, ``min_weight``, ``max_weight``. - Default "tiktak". - - mixing_weight_bounds (tuple): A tuple consisting of a lower and upper - bound on mixing weights. Default (0.1, 0.995). - - convergence_max_discoveries (int): The multistart optimization converges - if the currently best local optimum has been discovered independently in - ``convergence_max_discoveries`` many local optimizations. Default 2. - - convergence.relative_params_tolerance (float): Determines the maximum - relative distance two parameter vectors can have to be considered equal - for convergence purposes. 
- - n_cores (int): Number cores used to evaluate the criterion function in - parallel during exploration stages and number of parallel local - optimization in optimization stages. Default 1. - - batch_evaluator (str or callable): See :ref:`batch_evaluators` for - details. Default "joblib". - - batch_size (int): If n_cores is larger than one, several starting points - for local optimizations are created with the same weight and from the same - currently best point. The ``batch_size`` argument is a way to reproduce - this behavior on a small machine where less cores are available. By - default the batch_size is equal to ``n_cores``. It can never be smaller - than ``n_cores``. - - seed (int): Random seed for the creation of starting values. Default None. - - exploration_error_handling (str): One of "raise" or "continue". Default - is continue, which means that failed function evaluations are simply - discarded from the sample. - - optimization_error_handling (str): One of "raise" or "continue". Default - is continue, which means that failed optimizations are simply discarded. - collect_history (bool): Whether the history of parameters and criterion values - should be collected and returned as part of the result. Default True. - skip_checks (bool): Whether checks on the inputs are skipped. This makes the - optimization faster, especially for very fast criterion functions. Default - False. - - Returns: - OptimizeResult: The optmization result. 
+ """Minimize criterion using algorithm subject to constraints.""" - """ return _optimize( direction="minimize", - criterion=criterion, + fun=fun, params=params, algorithm=algorithm, lower_bounds=lower_bounds, upper_bounds=upper_bounds, soft_lower_bounds=soft_lower_bounds, soft_upper_bounds=soft_upper_bounds, - criterion_kwargs=criterion_kwargs, + fun_kwargs=fun_kwargs, constraints=constraints, algo_options=algo_options, - derivative=derivative, - derivative_kwargs=derivative_kwargs, - criterion_and_derivative=criterion_and_derivative, - criterion_and_derivative_kwargs=criterion_and_derivative_kwargs, + jac=jac, + jac_kwargs=jac_kwargs, + fun_and_jac=fun_and_jac, + fun_and_jac_kwargs=fun_and_jac_kwargs, numdiff_options=numdiff_options, logging=logging, log_options=log_options, @@ -431,26 +173,33 @@ def minimize( multistart_options=multistart_options, collect_history=collect_history, skip_checks=skip_checks, + # deprecated arguments + criterion=criterion, + criterion_kwargs=criterion_kwargs, + derivative=derivative, + derivative_kwargs=derivative_kwargs, + criterion_and_derivative=criterion_and_derivative, + criterion_and_derivative_kwargs=criterion_and_derivative_kwargs, ) def _optimize( direction, - criterion, + fun, params, algorithm, *, - lower_bounds=None, - upper_bounds=None, - soft_lower_bounds=None, - soft_upper_bounds=None, - criterion_kwargs, + lower_bounds, + upper_bounds, + soft_lower_bounds, + soft_upper_bounds, + fun_kwargs, constraints, algo_options, - derivative, - derivative_kwargs, - criterion_and_derivative, - criterion_and_derivative_kwargs, + jac, + jac_kwargs, + fun_and_jac, + fun_and_jac_kwargs, numdiff_options, logging, log_options, @@ -462,6 +211,13 @@ def _optimize( multistart_options, collect_history, skip_checks, + # deprecated arguments + criterion, + criterion_kwargs, + derivative, + derivative_kwargs, + criterion_and_derivative, + criterion_and_derivative_kwargs, ): """Minimize or maximize criterion using algorithm subject to 
constraints. @@ -471,14 +227,115 @@ def _optimize( Returns are the same as in maximize and minimize. """ + # ================================================================================== + # error handling needed as long as fun is an optional argument (i.e. until + # criterion is fully removed). + # ================================================================================== + + if fun is None and criterion is None: + msg = ( + "Missing objective function. Please provide an objective function as the " + "first positional argument or as the keyword argument `fun`." + ) + raise MissingInputError(msg) + + if params is None: + msg = ( + "Missing start parameters. Please provide start parameters as the second " + "positional argument or as the keyword argument `params`." + ) + raise MissingInputError(msg) + + if algorithm is None: + msg = ( + "Missing algorithm. Please provide an algorithm as the third positional " + "argument or as the keyword argument `algorithm`." + ) + raise MissingInputError(msg) + + # ================================================================================== + # deprecations + # ================================================================================== + + if criterion is not None: + msg = ( + "To align optimagic with scipy.optimize, the `criterion` argument has been " + "renamed to `fun`. Please use `fun` instead of `criterion`. Using " + "`criterion` will become an error in optimagic version 0.6.0 and later." + ) + warnings.warn(msg, DeprecationWarning) + + if fun is None: + fun = criterion + + if criterion_kwargs is not None: + msg = ( + "To align optimagic with scipy.optimize, the `criterion_kwargs` argument " + "has been renamed to `fun_kwargs`. Please use `fun_kwargs` instead of " + "`criterion_kwargs`. Using `criterion_kwargs` will become an error in " + "optimagic version 0.6.0 and later." 
+ ) + warnings.warn(msg, DeprecationWarning) + + if fun_kwargs is None: + fun_kwargs = criterion_kwargs + + if derivative is not None: + msg = ( + "To align optimagic with scipy.optimize, the `derivative` argument has " + "been renamed to `jac`. Please use `jac` instead of `derivative`. Using " + "`derivative` will become an error in optimagic version 0.6.0 and later." + ) + warnings.warn(msg, DeprecationWarning) + + if jac is None: + jac = derivative + + if derivative_kwargs is not None: + msg = ( + "To align optimagic with scipy.optimize, the `derivative_kwargs` argument " + "has been renamed to `jac_kwargs`. Please use `jac_kwargs` instead of " + "`derivative_kwargs`. Using `derivative_kwargs` will become an error in " + "optimagic version 0.6.0 and later." + ) + warnings.warn(msg, DeprecationWarning) + + if jac_kwargs is None: + jac_kwargs = derivative_kwargs + + if criterion_and_derivative is not None: + msg = ( + "To align optimagic with scipy.optimize, the `criterion_and_derivative` " + "argument has been renamed to `fun_and_jac`. Please use `fun_and_jac` " + "instead of `criterion_and_derivative`. Using `criterion_and_derivative` " + "will become an error in optimagic version 0.6.0 and later." + ) + warnings.warn(msg, DeprecationWarning) + + if fun_and_jac is None: + fun_and_jac = criterion_and_derivative + + if criterion_and_derivative_kwargs is not None: + msg = ( + "To align optimagic with scipy.optimize, the " + "`criterion_and_derivative_kwargs` argument has been renamed to " + "`fun_and_jac_kwargs`. Please use `fun_and_jac_kwargs` instead of " + "`criterion_and_derivative_kwargs`. Using `criterion_and_derivative_kwargs`" + " will become an error in optimagic version 0.6.0 and later." 
+ ) + warnings.warn(msg, DeprecationWarning) + + if fun_and_jac_kwargs is None: + fun_and_jac_kwargs = criterion_and_derivative_kwargs + # ================================================================================== # Set default values and check options # ================================================================================== - criterion_kwargs = _setdefault(criterion_kwargs, {}) + fun_kwargs = _setdefault(fun_kwargs, {}) constraints = _setdefault(constraints, []) algo_options = _setdefault(algo_options, {}) - derivative_kwargs = _setdefault(derivative_kwargs, {}) - criterion_and_derivative_kwargs = _setdefault(criterion_and_derivative_kwargs, {}) + jac_kwargs = _setdefault(jac_kwargs, {}) + fun_and_jac_kwargs = _setdefault(fun_and_jac_kwargs, {}) numdiff_options = _setdefault(numdiff_options, {}) log_options = _setdefault(log_options, {}) scaling_options = _setdefault(scaling_options, {}) @@ -490,16 +347,16 @@ def _optimize( if not skip_checks: check_optimize_kwargs( direction=direction, - criterion=criterion, - criterion_kwargs=criterion_kwargs, + criterion=fun, + criterion_kwargs=fun_kwargs, params=params, algorithm=algorithm, constraints=constraints, algo_options=algo_options, - derivative=derivative, - derivative_kwargs=derivative_kwargs, - criterion_and_derivative=criterion_and_derivative, - criterion_and_derivative_kwargs=criterion_and_derivative_kwargs, + derivative=jac, + derivative_kwargs=jac_kwargs, + criterion_and_derivative=fun_and_jac, + criterion_and_derivative_kwargs=fun_and_jac_kwargs, numdiff_options=numdiff_options, logging=logging, log_options=log_options, @@ -548,14 +405,14 @@ def _optimize( problem_data = { "direction": direction, # "criterion"-criterion, - "criterion_kwargs": criterion_kwargs, + "criterion_kwargs": fun_kwargs, "algorithm": algorithm, "constraints": constraints, "algo_options": algo_options, # "derivative"-derivative, - "derivative_kwargs": derivative_kwargs, + "derivative_kwargs": jac_kwargs, # 
"criterion_and_derivative"-criterion_and_derivative, - "criterion_and_derivative_kwargs": criterion_and_derivative_kwargs, + "criterion_and_derivative_kwargs": fun_and_jac_kwargs, "numdiff_options": numdiff_options, "log_options": log_options, "error_handling": error_handling, @@ -566,30 +423,28 @@ def _optimize( # ================================================================================== # partial the kwargs into corresponding functions # ================================================================================== - criterion = process_func_of_params( - func=criterion, - kwargs=criterion_kwargs, + fun = process_func_of_params( + func=fun, + kwargs=fun_kwargs, name="criterion", skip_checks=skip_checks, ) - if isinstance(derivative, dict): - derivative = derivative.get(algo_info.primary_criterion_entry) - if derivative is not None: - derivative = process_func_of_params( - func=derivative, - kwargs=derivative_kwargs, + if isinstance(jac, dict): + jac = jac.get(algo_info.primary_criterion_entry) + if jac is not None: + jac = process_func_of_params( + func=jac, + kwargs=jac_kwargs, name="derivative", skip_checks=skip_checks, ) - if isinstance(criterion_and_derivative, dict): - criterion_and_derivative = criterion_and_derivative.get( - algo_info.primary_criterion_entry - ) + if isinstance(fun_and_jac, dict): + fun_and_jac = fun_and_jac.get(algo_info.primary_criterion_entry) - if criterion_and_derivative is not None: - criterion_and_derivative = process_func_of_params( - func=criterion_and_derivative, - kwargs=criterion_and_derivative_kwargs, + if fun_and_jac is not None: + fun_and_jac = process_func_of_params( + func=fun_and_jac, + kwargs=fun_and_jac_kwargs, name="criterion_and_derivative", skip_checks=skip_checks, ) @@ -598,7 +453,7 @@ def _optimize( # Do first evaluation of user provided functions # ================================================================================== try: - first_crit_eval = criterion(params) + first_crit_eval = fun(params) 
except (KeyboardInterrupt, SystemExit): raise except Exception as e: @@ -606,27 +461,27 @@ def _optimize( raise InvalidFunctionError(msg) from e # do first derivative evaluation (if given) - if derivative is not None: + if jac is not None: try: - first_deriv_eval = derivative(params) + first_deriv_eval = jac(params) except (KeyboardInterrupt, SystemExit): raise except Exception as e: msg = "Error while evaluating derivative at start params." raise InvalidFunctionError(msg) from e - if criterion_and_derivative is not None: + if fun_and_jac is not None: try: - first_crit_and_deriv_eval = criterion_and_derivative(params) + first_crit_and_deriv_eval = fun_and_jac(params) except (KeyboardInterrupt, SystemExit): raise except Exception as e: msg = "Error while evaluating criterion_and_derivative at start params." raise InvalidFunctionError(msg) from e - if derivative is not None: + if jac is not None: used_deriv = first_deriv_eval - elif criterion_and_derivative is not None: + elif fun_and_jac is not None: used_deriv = first_crit_and_deriv_eval[1] else: used_deriv = None @@ -714,10 +569,10 @@ def _optimize( # ================================================================================== to_partial = { "direction": direction, - "criterion": criterion, + "criterion": fun, "converter": converter, - "derivative": derivative, - "criterion_and_derivative": criterion_and_derivative, + "derivative": jac, + "criterion_and_derivative": fun_and_jac, "numdiff_options": numdiff_options, "logging": logging, "database": database, diff --git a/tests/optimagic/logging/test_read_log.py b/tests/optimagic/logging/test_read_log.py index a030675a1..4b6c890c7 100644 --- a/tests/optimagic/logging/test_read_log.py +++ b/tests/optimagic/logging/test_read_log.py @@ -21,7 +21,7 @@ def _crit(params): return x @ x minimize( - criterion=_crit, + fun=_crit, params={"a": 1, "b": 2, "c": 3}, algorithm="scipy_lbfgsb", logging=path, diff --git a/tests/optimagic/optimization/test_criterion_versions.py 
b/tests/optimagic/optimization/test_criterion_versions.py index e111c84d2..d04d05f64 100644 --- a/tests/optimagic/optimization/test_criterion_versions.py +++ b/tests/optimagic/optimization/test_criterion_versions.py @@ -49,7 +49,7 @@ def test_valid_criterion_versions(criterion, algorithm): start_params = pd.DataFrame() start_params["value"] = [1, 2, 3] res = minimize( - criterion=criterion, + fun=criterion, params=start_params, algorithm=algorithm, ) @@ -64,7 +64,7 @@ def test_invalid_criterion_versions(criterion, algorithm): with pytest.raises(InvalidFunctionError): minimize( - criterion=criterion, + fun=criterion, params=start_params, algorithm=algorithm, ) diff --git a/tests/optimagic/optimization/test_derivative_versions.py b/tests/optimagic/optimization/test_derivative_versions.py index 5f13173c9..e84595c99 100644 --- a/tests/optimagic/optimization/test_derivative_versions.py +++ b/tests/optimagic/optimization/test_derivative_versions.py @@ -69,11 +69,11 @@ def test_valid_derivative_versions( if direction == "minimize": res = minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=start_params, algorithm=algorithm, - derivative=derivative, - criterion_and_derivative=criterion_and_derivative, + jac=derivative, + fun_and_jac=criterion_and_derivative, error_handling="raise", ) else: @@ -84,11 +84,11 @@ def test_valid_derivative_versions( else switch_sign(criterion_and_derivative) ) res = maximize( - criterion=switch_sign(sos_dict_criterion), + fun=switch_sign(sos_dict_criterion), params=start_params, algorithm=algorithm, - derivative=deriv, - criterion_and_derivative=crit_and_deriv, + jac=deriv, + fun_and_jac=crit_and_deriv, error_handling="raise", ) @@ -107,11 +107,11 @@ def test_invalid_derivative_versions( if direction == "minimize": with pytest.raises(ValueError): minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=start_params, algorithm=algorithm, - derivative=derivative, - 
criterion_and_derivative=criterion_and_derivative, + jac=derivative, + fun_and_jac=criterion_and_derivative, ) else: deriv = derivative if derivative is None else switch_sign(derivative) @@ -122,11 +122,11 @@ def test_invalid_derivative_versions( ) with pytest.raises(ValueError): maximize( - criterion=switch_sign(sos_dict_criterion), + fun=switch_sign(sos_dict_criterion), params=start_params, algorithm=algorithm, - derivative=deriv, - criterion_and_derivative=crit_and_deriv, + jac=deriv, + fun_and_jac=crit_and_deriv, ) @@ -135,10 +135,10 @@ def test_dict_derivative(): start_params["value"] = [1, 2, 3] res = minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=start_params, algorithm="scipy_lbfgsb", - derivative=sos_dict_derivative, + jac=sos_dict_derivative, ) aaae(res.params["value"].to_numpy(), np.zeros(3)) diff --git a/tests/optimagic/optimization/test_history_collection.py b/tests/optimagic/optimization/test_history_collection.py index f77d3620e..51381b12a 100644 --- a/tests/optimagic/optimization/test_history_collection.py +++ b/tests/optimagic/optimization/test_history_collection.py @@ -29,7 +29,7 @@ def test_history_collection_with_parallelization(algorithm, tmp_path): logging = tmp_path / "log.db" collected_hist = minimize( - criterion=lambda x: {"root_contributions": x, "value": x @ x}, + fun=lambda x: {"root_contributions": x, "value": x @ x}, params=np.arange(5), algorithm=algorithm, lower_bounds=lb, @@ -112,7 +112,7 @@ def test_history_collection_with_dummy_optimizer(n_cores, batch_size): } res = minimize( - criterion=_fake_criterion, + fun=_fake_criterion, params=np.arange(5), algorithm=_dummy_optimizer, algo_options=options, diff --git a/tests/optimagic/optimization/test_jax_derivatives.py b/tests/optimagic/optimization/test_jax_derivatives.py index fd8c043a4..15c77d250 100644 --- a/tests/optimagic/optimization/test_jax_derivatives.py +++ b/tests/optimagic/optimization/test_jax_derivatives.py @@ -26,8 +26,8 @@ def criterion(x): 
gradient = jax.grad(criterion) res = minimize( - criterion=criterion, - derivative=gradient, + fun=criterion, + jac=gradient, params=start_params, algorithm="scipy_lbfgsb", ) @@ -44,10 +44,10 @@ def criterion(x): return x**2 res = minimize( - criterion=criterion, + fun=criterion, params=jnp.array(1.0), algorithm="scipy_lbfgsb", - derivative=jax.grad(criterion), + jac=jax.grad(criterion), ) assert isinstance(res.params, jnp.ndarray) @@ -60,10 +60,10 @@ def criterion(x): return x @ x res = minimize( - criterion=criterion, + fun=criterion, params=jnp.arange(3), algorithm="scipy_lbfgsb", - derivative=jax.grad(criterion), + jac=jax.grad(criterion), ) assert isinstance(res.params, jnp.ndarray) @@ -88,10 +88,10 @@ def ls_wrapper(x): } res = minimize( - criterion=criterion, + fun=criterion, params=jnp.array([1.0, 2.0, 3.0]), algorithm=algorithm, - derivative=deriv_dict, + jac=deriv_dict, ) assert isinstance(res.params, jnp.ndarray) @@ -110,10 +110,10 @@ def ls_wrapper(x): jac = jax.jacobian(ls_wrapper) res = minimize( - criterion=criterion, + fun=criterion, params=params, algorithm="scipy_ls_lm", - derivative=jac, + jac=jac, ) assert isinstance(res.params, dict) diff --git a/tests/optimagic/optimization/test_many_algorithms.py b/tests/optimagic/optimization/test_many_algorithms.py index 98586e46e..429354d06 100644 --- a/tests/optimagic/optimization/test_many_algorithms.py +++ b/tests/optimagic/optimization/test_many_algorithms.py @@ -39,7 +39,7 @@ def sos(x): @pytest.mark.parametrize("algorithm", LOCAL_ALGORITHMS) def test_algorithm_on_sum_of_squares(algorithm): res = minimize( - criterion=sos, + fun=sos, params=np.arange(3), algorithm=algorithm, collect_history=True, @@ -52,7 +52,7 @@ def test_algorithm_on_sum_of_squares(algorithm): @pytest.mark.parametrize("algorithm", BOUNDED_ALGORITHMS) def test_algorithm_on_sum_of_squares_with_binding_bounds(algorithm): res = minimize( - criterion=sos, + fun=sos, params=np.array([3, 2, -3]), lower_bounds=np.array([1, -np.inf, 
-np.inf]), upper_bounds=np.array([np.inf, np.inf, -1]), @@ -75,7 +75,7 @@ def test_algorithm_on_sum_of_squares_with_binding_bounds(algorithm): @pytest.mark.parametrize("algorithm", GLOBAL_ALGORITHMS_AVAILABLE) def test_global_algorithms_on_sum_of_squares(algorithm): res = minimize( - criterion=sos, + fun=sos, params=np.array([0.35, 0.35]), lower_bounds=np.array([0.2, -0.5]), upper_bounds=np.array([1, 0.5]), diff --git a/tests/optimagic/optimization/test_multistart.py b/tests/optimagic/optimization/test_multistart.py index f9b426679..5d1be2209 100644 --- a/tests/optimagic/optimization/test_multistart.py +++ b/tests/optimagic/optimization/test_multistart.py @@ -36,14 +36,14 @@ def test_multistart_minimize_with_sum_of_squares_at_defaults( ): if direction == "minimize": res = minimize( - criterion=criterion, + fun=criterion, params=params, algorithm="scipy_lbfgsb", multistart=True, ) else: res = maximize( - criterion=switch_sign(sos_dict_criterion), + fun=switch_sign(sos_dict_criterion), params=params, algorithm="scipy_lbfgsb", multistart=True, @@ -68,7 +68,7 @@ def test_multistart_with_existing_sample(params): options = {"sample": sample} res = minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=params, algorithm="scipy_lbfgsb", multistart=True, @@ -86,7 +86,7 @@ def test_convergence_via_max_discoveries_works(params): } res = maximize( - criterion=switch_sign(sos_dict_criterion), + fun=switch_sign(sos_dict_criterion), params=params, algorithm="scipy_lbfgsb", multistart=True, @@ -103,7 +103,7 @@ def test_steps_are_logged_as_skipped_if_convergence(params): } minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=params, algorithm="scipy_lbfgsb", multistart=True, @@ -120,7 +120,7 @@ def test_all_steps_occur_in_optimization_iterations_if_no_convergence(params): options = {"convergence_max_discoveries": np.inf} minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=params, algorithm="scipy_lbfgsb", 
multistart=True, @@ -143,7 +143,7 @@ def test_all_steps_occur_in_optimization_iterations_if_no_convergence(params): def test_with_non_transforming_constraints(params): res = minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=params, constraints=[{"loc": [0, 1], "type": "fixed", "value": [0, 1]}], algorithm="scipy_lbfgsb", @@ -156,7 +156,7 @@ def test_with_non_transforming_constraints(params): def test_error_is_raised_with_transforming_constraints(params): with pytest.raises(NotImplementedError): minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=params, constraints=[{"loc": [0, 1], "type": "probability"}], algorithm="scipy_lbfgsb", @@ -171,7 +171,7 @@ def _params_list_to_aray(params_list): def test_multistart_with_numpy_params(): res = minimize( - criterion=lambda params: params @ params, + fun=lambda params: params @ params, params=np.arange(5), algorithm="scipy_lbfgsb", soft_lower_bounds=np.full(5, -10), @@ -185,7 +185,7 @@ def test_multistart_with_numpy_params(): def test_with_invalid_bounds(): with pytest.raises(ValueError): minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=np.arange(5), algorithm="scipy_neldermead", multistart=True, @@ -198,7 +198,7 @@ def _crit(params): return x @ x res = minimize( - criterion=_crit, + fun=_crit, params=np.full(5, 10), soft_lower_bounds=np.full(5, -1), soft_upper_bounds=np.full(5, 11), @@ -243,7 +243,7 @@ def ackley(x): def test_multistart_with_least_squares_optimizers(): est = minimize( - criterion=sos_dict_criterion, + fun=sos_dict_criterion, params=np.array([-1, 1.0]), lower_bounds=np.full(2, -10.0), upper_bounds=np.full(2, 10.0), diff --git a/tests/optimagic/optimization/test_optimizations_with_scaling.py b/tests/optimagic/optimization/test_optimizations_with_scaling.py index 4679727b6..5d6db79f7 100644 --- a/tests/optimagic/optimization/test_optimizations_with_scaling.py +++ b/tests/optimagic/optimization/test_optimizations_with_scaling.py @@ -41,13 
+41,13 @@ def test_optimizations_with_scaling(algorithm, scaling_options): constraints = [{"loc": [3, 4], "type": "fixed"}] res = minimize( - criterion=sos_scalar_criterion, + fun=sos_scalar_criterion, params=params, constraints=constraints, algorithm=algorithm, scaling=True, scaling_options=scaling_options, - derivative=sos_gradient, + jac=sos_gradient, ) expected_solution = np.array([0, 0, 0, 3, 4]) diff --git a/tests/optimagic/optimization/test_optimize.py b/tests/optimagic/optimization/test_optimize.py index 2d3094e4c..e5bc74d5f 100644 --- a/tests/optimagic/optimization/test_optimize.py +++ b/tests/optimagic/optimization/test_optimize.py @@ -28,17 +28,17 @@ def raising_crit_and_deriv(params): # noqa: ARG001 with pytest.raises(InvalidFunctionError, match="Error while evaluating"): minimize( - criterion=sos_scalar_criterion, + fun=sos_scalar_criterion, params=params, algorithm="scipy_lbfgsb", - criterion_and_derivative=raising_crit_and_deriv, + fun_and_jac=raising_crit_and_deriv, ) def test_with_invalid_numdiff_options(): with pytest.raises(InvalidKwargsError): minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=np.arange(5), algorithm="scipy_lbfgsb", numdiff_options={"bla": 15}, diff --git a/tests/optimagic/optimization/test_params_versions.py b/tests/optimagic/optimization/test_params_versions.py index 8172d59a8..8557cecac 100644 --- a/tests/optimagic/optimization/test_params_versions.py +++ b/tests/optimagic/optimization/test_params_versions.py @@ -51,7 +51,7 @@ def test_tree_params_numerical_derivative_scalar_criterion(params): expected = np.zeros_like(flat) res = minimize( - criterion=flexible_sos_scalar, + fun=flexible_sos_scalar, params=params, algorithm="scipy_lbfgsb", ) @@ -65,8 +65,8 @@ def test_tree_params_scalar_criterion(params): expected = np.zeros_like(flat) res = minimize( - criterion=flexible_sos_scalar, - derivative=flexible_sos_scalar_derivative, + fun=flexible_sos_scalar, + jac=flexible_sos_scalar_derivative, params=params, 
algorithm="scipy_lbfgsb", ) @@ -86,7 +86,7 @@ def test_tree_params_numerical_derivative_sos_ls(params, algorithm): expected = np.zeros_like(flat) res = minimize( - criterion=flexible_sos_ls, + fun=flexible_sos_ls, params=params, algorithm=algorithm, ) @@ -105,8 +105,8 @@ def test_tree_params_sos_ls(params, algorithm): } res = minimize( - criterion=flexible_sos_ls, - derivative=derivatives, + fun=flexible_sos_ls, + jac=derivatives, params=params, algorithm=algorithm, ) diff --git a/tests/optimagic/optimization/test_useful_exceptions.py b/tests/optimagic/optimization/test_useful_exceptions.py index f5ace0662..ee5c02fc6 100644 --- a/tests/optimagic/optimization/test_useful_exceptions.py +++ b/tests/optimagic/optimization/test_useful_exceptions.py @@ -16,7 +16,7 @@ def f(params, bla, blubb): # noqa: ARG001 params = pd.DataFrame(np.ones((3, 1)), columns=["value"]) with pytest.raises(InvalidKwargsError): - minimize(f, params, "scipy_lbfgsb", criterion_kwargs={"bla": 3}) + minimize(f, params, "scipy_lbfgsb", fun_kwargs={"bla": 3}) def test_missing_derivative_kwargs(): @@ -29,9 +29,7 @@ def grad(params, bla, blubb): # noqa: ARG001 params = pd.DataFrame(np.ones((3, 1)), columns=["value"]) with pytest.raises(InvalidKwargsError): - minimize( - f, params, "scipy_lbfgsb", derivative=grad, derivative_kwargs={"bla": 3} - ) + minimize(f, params, "scipy_lbfgsb", jac=grad, jac_kwargs={"bla": 3}) def test_missing_criterion_and_derivative_kwargs(): @@ -48,8 +46,8 @@ def f_and_grad(params, bla, blubb): # noqa: ARG001 f, params, "scipy_lbfgsb", - criterion_and_derivative=f_and_grad, - criterion_and_derivative_kwargs={"bla": 3}, + fun_and_jac=f_and_grad, + fun_and_jac_kwargs={"bla": 3}, ) @@ -61,7 +59,7 @@ def f(params, bla, foo): # noqa: ARG001 snippet = "Did you mean" with pytest.raises(InvalidKwargsError, match=snippet): - minimize(f, params, "scipy_lbfgsb", criterion_kwargs={"bla": 3, "foa": 4}) + minimize(f, params, "scipy_lbfgsb", fun_kwargs={"bla": 3, "foa": 4}) def 
test_criterion_with_runtime_error_derivative_free(): diff --git a/tests/optimagic/optimization/test_with_advanced_constraints.py b/tests/optimagic/optimization/test_with_advanced_constraints.py index d5403f587..d43e52bed 100644 --- a/tests/optimagic/optimization/test_with_advanced_constraints.py +++ b/tests/optimagic/optimization/test_with_advanced_constraints.py @@ -70,10 +70,10 @@ def test_with_covariance_constraint_bounds_distance(derivative, constr_name): params = pd.Series(START_INFO[constr_name], name="value").to_frame() res = minimize( - criterion=sos_scalar_criterion, + fun=sos_scalar_criterion, params=params, algorithm="scipy_lbfgsb", - derivative=derivative, + jac=derivative, constraints=CONSTR_INFO[constr_name], ) diff --git a/tests/optimagic/optimization/test_with_constraints.py b/tests/optimagic/optimization/test_with_constraints.py index af21e59cb..6110387b6 100644 --- a/tests/optimagic/optimization/test_with_constraints.py +++ b/tests/optimagic/optimization/test_with_constraints.py @@ -168,10 +168,10 @@ def test_constrained_minimization( params = np.array(START_INFO[constraint_name]) res = minimize( - criterion=criterion, + fun=criterion, params=params, algorithm=algorithm, - derivative=derivative, + jac=derivative, constraints=constraints, algo_options={"convergence.relative_criterion_tolerance": 1e-12}, ) @@ -191,7 +191,7 @@ def test_constrained_minimization( def test_fix_that_differs_from_start_value_raises_an_error(): with pytest.raises(InvalidParamsError): minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=np.arange(3), algorithm="scipy_lbfgsb", constraints=[{"loc": [1], "type": "fixed", "value": 10}], @@ -209,7 +209,7 @@ def test_three_independent_constraints(): ] res = minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=params, algorithm="scipy_lbfgsb", constraints=constraints, @@ -235,7 +235,7 @@ def test_incompatible_constraints_raise_errors(constraints): with pytest.raises(InvalidConstraintError): 
minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=params, algorithm="scipy_lbfgsb", constraints=constraints, @@ -258,7 +258,7 @@ def return_all_but_working_hours(params): return out res = maximize( - criterion=u, + fun=u, params=start_params, algorithm="scipy_lbfgsb", constraints=[ @@ -279,7 +279,7 @@ def test_constraint_inheritance(): equality constraint, no matter to which set they were applied originally.""" for loc in [[0, 1], [2, 3]]: res = minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=np.array([0.1, 0.9, 0.9, 0.1]), algorithm="scipy_lbfgsb", constraints=[ @@ -314,8 +314,8 @@ def test_covariance_constraint_in_2_by_2_case(): kwargs = {"y": spector_data.endog, "x": x_df.to_numpy()} result = maximize( - criterion=logit_loglike, - criterion_kwargs=kwargs, + fun=logit_loglike, + fun_kwargs=kwargs, params=start_params, algorithm="scipy_lbfgsb", constraints={"loc": [1, 2, 3], "type": "covariance"}, diff --git a/tests/optimagic/optimization/test_with_nonlinear_constraints.py b/tests/optimagic/optimization/test_with_nonlinear_constraints.py index ee7f00726..367a30da8 100644 --- a/tests/optimagic/optimization/test_with_nonlinear_constraints.py +++ b/tests/optimagic/optimization/test_with_nonlinear_constraints.py @@ -169,7 +169,7 @@ def test_documentation_example(algorithm): del kwargs["upper_bounds"] minimize( - criterion=criterion, + fun=criterion, params=np.ones(6), algorithm=algorithm, constraints={ diff --git a/tests/optimagic/visualization/test_history_plots.py b/tests/optimagic/visualization/test_history_plots.py index 903c25e5d..a31c7ecdc 100644 --- a/tests/optimagic/visualization/test_history_plots.py +++ b/tests/optimagic/visualization/test_history_plots.py @@ -13,7 +13,7 @@ def minimize_result(): res = [] for algorithm in ["scipy_neldermead", "scipy_lbfgsb"]: _res = minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=np.arange(5), algorithm=algorithm, soft_lower_bounds=np.full(5, -1), @@ -96,7 +96,7 @@ 
def test_criterion_plot_wrong_results(): def test_criterion_plot_different_input_types(): # logged result minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=np.arange(5), algorithm="scipy_lbfgsb", soft_lower_bounds=np.full(5, -1), @@ -108,7 +108,7 @@ def test_criterion_plot_different_input_types(): ) res = minimize( - criterion=lambda x: x @ x, + fun=lambda x: x @ x, params=np.arange(5), algorithm="scipy_lbfgsb", soft_lower_bounds=np.full(5, -1), diff --git a/tests/test_deprecations.py b/tests/test_deprecations.py index d442e2a35..be1d7d465 100644 --- a/tests/test_deprecations.py +++ b/tests/test_deprecations.py @@ -121,7 +121,7 @@ def _crit(params): return x @ x om.minimize( - criterion=_crit, + fun=_crit, params={"a": 1, "b": 2, "c": 3}, algorithm="scipy_lbfgsb", logging=path, From 8cb3d02c975e92147189aab59f5c1100da4cd4ea Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 13:52:29 +0200 Subject: [PATCH 05/25] Fix deprecation warnings in estimation. --- src/estimagic/estimate_msm.py | 8 ++++---- src/optimagic/optimization/optimize.py | 12 ++++++------ tests/estimagic/test_estimate_ml.py | 10 +++++----- 3 files changed, 15 insertions(+), 15 deletions(-) diff --git a/src/estimagic/estimate_msm.py b/src/estimagic/estimate_msm.py index 1c807118c..562dc6c47 100644 --- a/src/estimagic/estimate_msm.py +++ b/src/estimagic/estimate_msm.py @@ -372,9 +372,9 @@ def get_msm_optimization_functions( jacobian_kwargs (dict): Additional keyword arguments for jacobian. Returns: - dict: Dictionary containing at least the entry "criterion". If enough inputs - are provided it also contains the entries "derivative" and - "criterion_and_derivative". All values are functions that take params + dict: Dictionary containing at least the entry "fun". If enough inputs + are provided it also contains the entries "jac" and + "fun_and_jac". All values are functions that take params as only argument. 
""" @@ -400,7 +400,7 @@ def get_msm_optimization_functions( registry=registry, ) - out = {"criterion": criterion} + out = {"fun": criterion} if _jacobian is not None: raise NotImplementedError( diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index 1dcf8de81..1bf25b03b 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -263,7 +263,7 @@ def _optimize( "renamed to `fun`. Please use `fun` instead of `criterion`. Using " "`criterion` will become an error in optimagic version 0.6.0 and later." ) - warnings.warn(msg, DeprecationWarning) + warnings.warn(msg, FutureWarning) if fun is None: fun = criterion @@ -275,7 +275,7 @@ def _optimize( "`criterion_kwargs`. Using `criterion_kwargs` will become an error in " "optimagic version 0.6.0 and later." ) - warnings.warn(msg, DeprecationWarning) + warnings.warn(msg, FutureWarning) if fun_kwargs is None: fun_kwargs = criterion_kwargs @@ -286,7 +286,7 @@ def _optimize( "been renamed to `jac`. Please use `jac` instead of `derivative`. Using " "`derivative` will become an error in optimagic version 0.6.0 and later." ) - warnings.warn(msg, DeprecationWarning) + warnings.warn(msg, FutureWarning) if jac is None: jac = derivative @@ -298,7 +298,7 @@ def _optimize( "`derivative_kwargs`. Using `derivative_kwargs` will become an error in " "optimagic version 0.6.0 and later." ) - warnings.warn(msg, DeprecationWarning) + warnings.warn(msg, FutureWarning) if jac_kwargs is None: jac_kwargs = derivative_kwargs @@ -310,7 +310,7 @@ def _optimize( "instead of `criterion_and_derivative`. Using `criterion_and_derivative` " "will become an error in optimagic version 0.6.0 and later." ) - warnings.warn(msg, DeprecationWarning) + warnings.warn(msg, FutureWarning) if fun_and_jac is None: fun_and_jac = criterion_and_derivative @@ -323,7 +323,7 @@ def _optimize( "`criterion_and_derivative_kwargs`. 
Using `criterion_and_derivative_kwargs`" " will become an error in optimagic version 0.6.0 and later." ) - warnings.warn(msg, DeprecationWarning) + warnings.warn(msg, FutureWarning) if fun_and_jac_kwargs is None: fun_and_jac_kwargs = criterion_and_derivative_kwargs diff --git a/tests/estimagic/test_estimate_ml.py b/tests/estimagic/test_estimate_ml.py index 17245517d..5df2002a2 100644 --- a/tests/estimagic/test_estimate_ml.py +++ b/tests/estimagic/test_estimate_ml.py @@ -131,7 +131,7 @@ def logit_loglike_and_derivative(params, y, x): "scipy_lbfgsb", { "algorithm": "scipy_lbfgsb", - "criterion_and_derivative": logit_loglike_and_derivative, + "fun_and_jac": logit_loglike_and_derivative, }, ], # optimize_options [None, logit_jacobian, False], # jacobian @@ -160,8 +160,8 @@ def test_estimate_ml_with_logit_no_constraints( kwargs = {"y": logit_np_inputs["y"], "x": logit_np_inputs["x"]} - if "criterion_and_derivative" in optimize_options: - optimize_options["criterion_and_derivative_kwargs"] = kwargs + if "fun_and_jac" in optimize_options: + optimize_options["fun_and_jac_kwargs"] = kwargs got = estimate_ml( loglike=logit_loglike, @@ -268,8 +268,8 @@ def test_estimate_ml_with_logit_constraints( "algo_options": {"convergence.relative_criterion_tolerance": 1e-12}, } - if "criterion_and_derivative" in optimize_options: - optimize_options["criterion_and_derivative_kwargs"] = kwargs + if "fun_and_jac" in optimize_options: + optimize_options["fun_and_jac_kwargs"] = kwargs got = estimate_ml( loglike=logit_loglike, From 6b21ff12485209e85b762af5980b8fd9fc631df1 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 14:05:55 +0200 Subject: [PATCH 06/25] Fix remaining deprecation warnings. 
--- src/optimagic/benchmarking/cartis_roberts.py | 120 +++++++++--------- .../benchmarking/get_benchmark_problems.py | 10 +- src/optimagic/benchmarking/more_wild.py | 108 ++++++++-------- src/optimagic/benchmarking/run_benchmark.py | 2 +- .../benchmarking/test_cartis_roberts.py | 4 +- .../test_get_benchmark_problems.py | 2 +- .../optimagic/benchmarking/test_more_wild.py | 2 +- .../benchmarking/test_run_benchmark.py | 16 +-- .../optimagic/optimization/test_multistart.py | 2 +- 9 files changed, 133 insertions(+), 133 deletions(-) diff --git a/src/optimagic/benchmarking/cartis_roberts.py b/src/optimagic/benchmarking/cartis_roberts.py index d54102c90..6a827ba05 100644 --- a/src/optimagic/benchmarking/cartis_roberts.py +++ b/src/optimagic/benchmarking/cartis_roberts.py @@ -4849,7 +4849,7 @@ def get_start_points_methanl8(): CARTIS_ROBERTS_PROBLEMS = { "arglale": { # arglale is the same as linear_full_rank with specific settings - "criterion": partial(linear_full_rank, dim_out=400), + "fun": partial(linear_full_rank, dim_out=400), "start_x": [1] * 100, "solution_x": [-0.99999952] * 100, "start_criterion": 700, @@ -4857,98 +4857,98 @@ def get_start_points_methanl8(): }, "arglble": { # arglble is the same as linear_rank_one with specific settings - "criterion": partial(linear_rank_one, dim_out=400), + "fun": partial(linear_rank_one, dim_out=400), "start_x": [1] * 100, "solution_x": solution_x_arglble, "start_criterion": 5.460944e14, "solution_criterion": 99.62547, }, "argtrig": { - "criterion": argtrig, + "fun": argtrig, "start_x": [1 / 100] * 100, "solution_x": [0] * 100, "start_criterion": 32.99641, "solution_criterion": 0, }, "artif": { - "criterion": artif, + "fun": artif, "start_x": [1] * 100, "solution_x": None, "start_criterion": 36.59115, "solution_criterion": 0, }, "arwhdne": { - "criterion": arwhdne, + "fun": arwhdne, "start_x": [1] * 100, "solution_x": [0.706011] * 99 + [0], "start_criterion": 495, "solution_criterion": 27.66203, }, "bdvalues": { - "criterion": 
bdvalues, + "fun": bdvalues, "start_x": get_start_points_bdvalues(100, 1000), "solution_x": solution_x_bdvalues, "start_criterion": 1.943417e7, "solution_criterion": 0, }, "bratu_2d": { - "criterion": partial(bratu_2d, alpha=4), + "fun": partial(bratu_2d, alpha=4), "start_x": [0] * 64, "solution_x": solution_x_bratu_2d, "start_criterion": 0.1560738, "solution_criterion": 0, }, "bratu_2d_t": { - "criterion": partial(bratu_2d, alpha=6.80812), + "fun": partial(bratu_2d, alpha=6.80812), "start_x": [0] * 64, "solution_x": solution_x_bratu_2d_t, "start_criterion": 0.4521311, "solution_criterion": 1.8534736e-05, }, "bratu_3d": { - "criterion": partial(bratu_3d, alpha=6.80812), + "fun": partial(bratu_3d, alpha=6.80812), "start_x": [0] * 27, "solution_x": solution_x_bratu_3d, "start_criterion": 4.888529, "solution_criterion": 0, }, "brownale": { - "criterion": brown_almost_linear, + "fun": brown_almost_linear, "start_x": [0.5] * 100, "solution_x": [1] * 100, "start_criterion": 2.524757e5, "solution_criterion": 0, }, "broydn_3d": { - "criterion": broydn_3d, + "fun": broydn_3d, "start_x": [-1] * 100, "solution_x": solution_x_broydn_3d, "start_criterion": 111, "solution_criterion": 0, }, "cbratu_2d": { - "criterion": cbratu_2d, + "fun": cbratu_2d, "start_x": [0] * (2 * 5 * 5), "solution_x": solution_x_cbratu_2d, "start_criterion": 0.4822531, "solution_criterion": 0, }, "broydn_bd": { - "criterion": broydn_bd, + "fun": broydn_bd, "start_x": [1] * 100, "solution_x": solution_x_broydn_bd, "start_criterion": 2404, "solution_criterion": 0, }, "chandheq": { - "criterion": chandheq, + "fun": chandheq, "start_x": (np.arange(1, 101) / 100).tolist(), "solution_x": None, "start_criterion": 6.923365, "solution_criterion": 0, }, "chemrcta": { - "criterion": chemrcta, + "fun": chemrcta, "start_x": [1] * 100, "solution_x": None, "start_criterion": 3.0935, @@ -4956,7 +4956,7 @@ def get_start_points_methanl8(): "lower_bounds": np.concatenate([np.zeros(50), 1e-6 * np.ones(50)]), }, "chemrctb": 
{ - "criterion": chemrctb, + "fun": chemrctb, "start_x": [1] * 100, "solution_x": solution_x_chemrctb, "start_criterion": 1.446513, @@ -4964,35 +4964,35 @@ def get_start_points_methanl8(): "lower_bounds": 1e-6 * np.ones(100), }, "chnrsbne": { - "criterion": chnrsbne, + "fun": chnrsbne, "start_x": [-1] * 50, "solution_x": [1] * 50, "start_criterion": 7635.84, "solution_criterion": 0, }, "drcavty1": { - "criterion": partial(drcavty, r=500), + "fun": partial(drcavty, r=500), "start_x": [0] * 100, "solution_x": None, "start_criterion": 0.4513889, "solution_criterion": 0, }, "drcavty2": { - "criterion": partial(drcavty, r=1000), + "fun": partial(drcavty, r=1000), "start_x": [0] * 100, "solution_x": solution_x_drcavty2, "start_criterion": 0.4513889, "solution_criterion": 3.988378e-4, }, "drcavty3": { - "criterion": partial(drcavty, r=4500), + "fun": partial(drcavty, r=4500), "start_x": [0] * 100, "solution_x": solution_x_drcavty3, "start_criterion": 0.4513889, "solution_criterion": 0, }, "eigena": { - "criterion": partial(eigen, param=np.diag(np.arange(1, 11))), + "fun": partial(eigen, param=np.diag(np.arange(1, 11))), "start_x": [1] * 10 + np.eye(10).flatten().tolist(), "solution_x": [*np.arange(1, 11).tolist(), 1] + ([0] * 10 + [1]) * 9, "start_criterion": 285, @@ -5000,7 +5000,7 @@ def get_start_points_methanl8(): "lower_bounds": np.zeros(110), }, "eigenb": { - "criterion": partial( + "fun": partial( eigen, param=np.diag(2 * np.ones(10)) + np.diag(-np.ones(9), k=1) ), "start_x": [1] * 10 + np.eye(10).flatten().tolist(), @@ -5011,7 +5011,7 @@ def get_start_points_methanl8(): # according to table 3 in their paper, the minimum is at 0. 
}, "flosp2hh": { - "criterion": partial( + "fun": partial( flosp2, a=np.array([1, 0, -1], dtype=np.int64), b=np.array([1, 0, -1], dtype=np.int64), @@ -5023,7 +5023,7 @@ def get_start_points_methanl8(): "solution_criterion": 1 / 3, }, "flosp2hl": { - "criterion": partial( + "fun": partial( flosp2, a=np.array([1, 0, -1], dtype=np.float64), b=np.array([1, 0, -1], dtype=np.float64), @@ -5035,7 +5035,7 @@ def get_start_points_methanl8(): "solution_criterion": 1 / 3, }, "flosp2hm": { - "criterion": partial( + "fun": partial( flosp2, a=np.array([1, 0, -1], dtype=np.float64), b=np.array([1, 0, -1], dtype=np.float64), @@ -5047,7 +5047,7 @@ def get_start_points_methanl8(): "solution_criterion": 1 / 3, }, "flosp2th": { - "criterion": partial( + "fun": partial( flosp2, a=np.array([0, 1, 0], dtype=np.float64), b=np.array([0, 1, 1], dtype=np.float64), @@ -5059,7 +5059,7 @@ def get_start_points_methanl8(): "solution_criterion": 0, }, "flosp2tl": { - "criterion": partial( + "fun": partial( flosp2, a=np.array([0, 1, 0], dtype=np.float64), b=np.array([0, 1, 1], dtype=np.float64), @@ -5071,7 +5071,7 @@ def get_start_points_methanl8(): "solution_criterion": 0, }, "flosp2tm": { - "criterion": partial( + "fun": partial( flosp2, a=np.array([0, 1, 0], dtype=np.float64), b=np.array([0, 1, 1], dtype=np.float64), @@ -5083,49 +5083,49 @@ def get_start_points_methanl8(): "solution_criterion": 0, }, "freurone": { - "criterion": freurone, + "fun": freurone, "start_x": [0.5, -2] + [0] * 98, "solution_x": solution_x_freurone, "start_criterion": 9.95565e4, "solution_criterion": 1.196458e4, }, "hatfldg": { - "criterion": hatfldg, + "fun": hatfldg, "start_x": [1] * 25, "solution_x": [0] * 11 + [-1, 1] + [0] * 12, "start_criterion": 27, "solution_criterion": 0, }, "hydcar20": { - "criterion": partial(hydcar, n=20, m=3, k=9), + "fun": partial(hydcar, n=20, m=3, k=9), "start_x": get_start_points_hydcar20(), "solution_x": solution_x_hydcar20, "start_criterion": 1341.663, "solution_criterion": 0, }, 
"hydcar6": { - "criterion": partial(hydcar, n=6, m=3, k=2), + "fun": partial(hydcar, n=6, m=3, k=2), "start_x": get_start_points_hydcar6(), "solution_x": solution_x_hydcar6, "start_criterion": 704.1073, "solution_criterion": 0, }, "integreq": { - "criterion": integreq, + "fun": integreq, "start_x": (np.arange(1, 101) / 101 * (np.arange(1, 101) / 101 - 1)).tolist(), "solution_x": solution_x_integreq, "start_criterion": 0.5730503, "solution_criterion": 0, }, "luksan11": { - "criterion": luksan11, + "fun": luksan11, "start_x": [-0.8] * 100, "solution_x": [1] * 100, "start_criterion": 626.0640, "solution_criterion": 0, }, "luksan12": { - "criterion": luksan12, + "fun": luksan12, "start_x": [-1] * 98, "solution_x": None, "start_criterion": 3.2160e4, @@ -5136,7 +5136,7 @@ def get_start_points_methanl8(): # That is why we disable this test function for the time being. }, "luksan13": { - "criterion": luksan13, + "fun": luksan13, "start_x": [-1] * 98, "solution_x": solution_x_luksan13, "start_criterion": 6.4352e4, @@ -5145,112 +5145,112 @@ def get_start_points_methanl8(): # according to table 3 in their paper, the minimum is at 25188.86 }, "luksan14": { - "criterion": luksan14, + "fun": luksan14, "start_x": [-1] * 98, "solution_x": solution_x_luksan14, "start_criterion": 2.6880e4, "solution_criterion": 123.9235, }, "luksan15": { - "criterion": luksan15, + "fun": luksan15, "start_x": [-0.8, 1.2, -1.2, 0.8] * 25, "solution_x": solution_x_luksan15, "start_criterion": 2.701585e4, "solution_criterion": 3.569697, }, "luksan16": { - "criterion": luksan16, + "fun": luksan16, "start_x": [-0.8, 1.2, -1.2, 0.8] * 25, "solution_x": solution_x_luksan16, "start_criterion": 1.306848e4, "solution_criterion": 3.569697, }, "luksan17": { - "criterion": luksan17, + "fun": luksan17, "start_x": [-0.8, 1.2, -1.2, 0.8] * 25, "solution_x": None, # multiple argmins "start_criterion": 1.687370e6, "solution_criterion": 0.4931613, }, "luksan21": { - "criterion": luksan21, + "fun": luksan21, "start_x": 
[ih * (ih - 1) for ih in np.arange(1, 101) * (1 / 101)], "solution_x": solution_x_luksan21, "start_criterion": 99.98751, "solution_criterion": 0, }, "luksan22": { - "criterion": luksan22, + "fun": luksan22, "start_x": [-1.2 if i % 2 == 0 else 1 for i in range(100)], "solution_x": solution_x_luksan22, "start_criterion": 2.487686e4, "solution_criterion": 872.9230, }, "methanb8": { - "criterion": methane, + "fun": methane, "start_x": get_start_points_methanb8(), "solution_x": solution_x_methane, "start_criterion": 1.043105, "solution_criterion": 0, }, "methanl8": { - "criterion": methane, + "fun": methane, "start_x": get_start_points_methanl8(), "solution_x": solution_x_methane, "start_criterion": 4345.100, "solution_criterion": 0, }, "morebvne": { - "criterion": morebvne, + "fun": morebvne, "start_x": [t * (t - 1) for t in np.arange(1, 101) * (1 / 101)], "solution_x": solution_x_morebvne, "start_criterion": 3.633100e-4, "solution_criterion": 0, }, "msqrta": { - "criterion": msqrta, + "fun": msqrta, "start_x": get_start_points_msqrta(10), "solution_x": solution_x_msqrta, "start_criterion": 212.7162, "solution_criterion": 0, }, "msqrtb": { - "criterion": msqrta, + "fun": msqrta, "start_x": get_start_points_msqrta(10, flag=2), "solution_x": solution_x_msqrtb, "start_criterion": 205.0753, "solution_criterion": 0, }, "oscigrne": { - "criterion": oscigrne, + "fun": oscigrne, "start_x": [-2] + [1] * 99, "solution_x": solution_x_oscigrne, "start_criterion": 6.120720e8, "solution_criterion": 0, }, "penalty_1": { - "criterion": penalty_1, + "fun": penalty_1, "start_x": list(range(1, 101)), "solution_x": None, "start_criterion": 1.144806e11, "solution_criterion": 9.025000e-9, }, "penalty_2": { - "criterion": penalty_2, + "fun": penalty_2, "start_x": [0.5] * 100, "solution_x": solution_x_penalty2, "start_criterion": 1.591383e6, "solution_criterion": 0.9809377, }, "powellse": { - "criterion": powell_singular, + "fun": powell_singular, "start_x": [3.0, -1.0, 0.0, 1] * 25, 
"solution_x": [0] * 100, "start_criterion": 41875, "solution_criterion": 0, }, "qr3d": { - "criterion": partial(qr3d, m=5), + "fun": partial(qr3d, m=5), "start_x": get_start_points_qr3d(5), "solution_x": solution_x_qr3d, "start_criterion": 1.2, @@ -5259,7 +5259,7 @@ def get_start_points_methanl8(): + [0 if i == j else -np.inf for i in range(5) for j in range(5)], }, "qr3dbd": { - "criterion": partial(qr3dbd, m=5), + "fun": partial(qr3dbd, m=5), "start_x": get_start_points_qr3dbd(5), "solution_x": solution_x_qr3dbd, "start_criterion": 1.2, @@ -5268,21 +5268,21 @@ def get_start_points_methanl8(): + [0 if i == j else -np.inf for i in range(5) for j in range(5)], }, "spmsqrt": { - "criterion": spmsqrt, + "fun": spmsqrt, "start_x": get_start_points_spmsqrt(34), "solution_x": solution_x_spmsqrt, "start_criterion": 74.33542, "solution_criterion": 0, }, "semicn2u": { - "criterion": semicon2, + "fun": semicon2, "start_x": [0] * 100, "solution_x": solution_x_semicon2, "start_criterion": 2.025037e4, "solution_criterion": 0, }, "semicon2": { - "criterion": semicon2, + "fun": semicon2, "start_x": [0] * 100, "solution_x": solution_x_semicon2, "start_criterion": 2.025037e4, @@ -5291,28 +5291,28 @@ def get_start_points_methanl8(): "upper_bounds": 0.2 * 700 * np.ones(100), }, "vardimne": { - "criterion": vardimne, + "fun": vardimne, "start_x": [1 - i / 100 for i in range(1, 101)], "solution_x": [1] * 100, "start_criterion": 1.310584e14, "solution_criterion": 0, }, "watsonne": { - "criterion": watson, + "fun": watson, "start_x": [0] * 31, "solution_x": solution_x_watson, "start_criterion": 30, "solution_criterion": 0, }, "yatpsq_1": { - "criterion": partial(yatpsq_1, dim_in=10), + "fun": partial(yatpsq_1, dim_in=10), "start_x": [6] * 100 + [0] * 20, "solution_x": solution_x_yatpsq_1, "start_criterion": 2.073643e6, "solution_criterion": 0, }, "yatpsq_2": { - "criterion": partial(yatpsq_2, dim_in=10), + "fun": partial(yatpsq_2, dim_in=10), "start_x": [10] * 100 + [0] * 20, 
"solution_x": solution_x_yatpsq_2, "start_criterion": 1.831687e5, diff --git a/src/optimagic/benchmarking/get_benchmark_problems.py b/src/optimagic/benchmarking/get_benchmark_problems.py index 713092484..5473e6204 100644 --- a/src/optimagic/benchmarking/get_benchmark_problems.py +++ b/src/optimagic/benchmarking/get_benchmark_problems.py @@ -116,7 +116,7 @@ def get_benchmark_problems( problems[prob_name] = { "inputs": inputs, - "noise_free_criterion": specification["criterion"], + "noise_free_fun": specification["fun"], "solution": _create_problem_solution( specification, scaling_options=scaling_options ), @@ -192,9 +192,9 @@ def _get_raw_problems(name): raw_problems[k] = v if k in subset_add_steps: problem = v.copy() - raw_func = problem["criterion"] + raw_func = problem["fun"] - problem["criterion"] = partial(_step_func, raw_func=raw_func) + problem["fun"] = partial(_step_func, raw_func=raw_func) raw_problems[f"{k}_with_steps"] = problem for k, v in CARTIS_ROBERTS_PROBLEMS.items(): @@ -223,14 +223,14 @@ def _create_problem_inputs( _criterion = partial( _internal_criterion_template, - criterion=specification["criterion"], + criterion=specification["fun"], additive_options=additive_options, multiplicative_options=multiplicative_options, scaling_factor=scaling_factor, rng=rng, ) - inputs = {"criterion": _criterion, "params": _x} + inputs = {"fun": _criterion, "params": _x} return inputs diff --git a/src/optimagic/benchmarking/more_wild.py b/src/optimagic/benchmarking/more_wild.py index 250c155b6..b842840d2 100644 --- a/src/optimagic/benchmarking/more_wild.py +++ b/src/optimagic/benchmarking/more_wild.py @@ -762,21 +762,21 @@ def get_start_points_mancino(n, a=1): MORE_WILD_PROBLEMS = { "linear_full_rank_good_start": { - "criterion": partial(linear_full_rank, dim_out=45), + "fun": partial(linear_full_rank, dim_out=45), "start_x": [1] * 9, "solution_x": linear_full_rank_solution_x, "start_criterion": 72, "solution_criterion": 36, }, "linear_full_rank_bad_start": { - 
"criterion": partial(linear_full_rank, dim_out=45), + "fun": partial(linear_full_rank, dim_out=45), "start_x": [10] * 9, "solution_x": linear_full_rank_solution_x, "start_criterion": 1125, "solution_criterion": 36, }, "linear_rank_one_good_start": { - "criterion": partial(linear_rank_one, dim_out=35), + "fun": partial(linear_rank_one, dim_out=35), "start_x": [1] * 7, # no unique solution "solution_x": None, @@ -784,7 +784,7 @@ def get_start_points_mancino(n, a=1): "solution_criterion": 8.380281690143324, }, "linear_rank_one_bad_start": { - "criterion": partial(linear_rank_one, dim_out=35), + "fun": partial(linear_rank_one, dim_out=35), "start_x": [10] * 7, # no unique solution "solution_x": None, @@ -792,7 +792,7 @@ def get_start_points_mancino(n, a=1): "solution_criterion": 8.380282, }, "linear_rank_one_zero_columns_rows_good_start": { - "criterion": partial(linear_rank_one_zero_columns_rows, dim_out=35), + "fun": partial(linear_rank_one_zero_columns_rows, dim_out=35), "start_x": [1] * 7, # no unique solution "solution_x": None, @@ -800,7 +800,7 @@ def get_start_points_mancino(n, a=1): "solution_criterion": 9.880597014926506, }, "linear_rank_one_zero_columns_rows_bad_start": { - "criterion": partial(linear_rank_one_zero_columns_rows, dim_out=35), + "fun": partial(linear_rank_one_zero_columns_rows, dim_out=35), "start_x": [10] * 7, # no unique solution "solution_x": None, @@ -808,77 +808,77 @@ def get_start_points_mancino(n, a=1): "solution_criterion": 9.880597014926506, }, "rosenbrock_good_start": { - "criterion": rosenbrock, + "fun": rosenbrock, "start_x": [-1.2, 1], "solution_x": [1, 1], "start_criterion": 24.2, "solution_criterion": 0, }, "rosenbrock_bad_start": { - "criterion": rosenbrock, + "fun": rosenbrock, "start_x": [-12, 10], "solution_x": [1, 1], "start_criterion": 1.795769e6, "solution_criterion": 0, }, "helical_valley_good_start": { - "criterion": helical_valley, + "fun": helical_valley, "start_x": [-1, 0, 0], "solution_x": [1, 0, 0], 
"start_criterion": 2500, "solution_criterion": 0, }, "helical_valley_bad_start": { - "criterion": helical_valley, + "fun": helical_valley, "start_x": [-10, 0, 0], "solution_x": [1, 0, 0], "start_criterion": 10600, "solution_criterion": 0, }, "powell_singular_good_start": { - "criterion": powell_singular, + "fun": powell_singular, "start_x": [3, -1, 0, 1], "solution_x": [0] * 4, "start_criterion": 215, "solution_criterion": 0, }, "powell_singular_bad_start": { - "criterion": powell_singular, + "fun": powell_singular, "start_x": [30, -10, 0, 10], "solution_x": [0] * 4, "start_criterion": 1.615400e6, "solution_criterion": 0, }, "freudenstein_roth_good_start": { - "criterion": freudenstein_roth, + "fun": freudenstein_roth, "start_x": [0.5, -2], "solution_x": freudenstein_roth_solution_x, "start_criterion": 400.5, "solution_criterion": 48.984253679240013, }, "freudenstein_roth_bad_start": { - "criterion": freudenstein_roth, + "fun": freudenstein_roth, "start_x": [5, -20], "solution_x": freudenstein_roth_solution_x, "start_criterion": 1.545754e8, "solution_criterion": 48.984253679240013, }, "bard_good_start": { - "criterion": partial(bard, y=y_vec), + "fun": partial(bard, y=y_vec), "start_x": [1] * 3, "solution_x": bard_solution_x, "start_criterion": 41.68170, "solution_criterion": 0.00821487730657897, }, "bard_bad_start": { - "criterion": partial(bard, y=y_vec), + "fun": partial(bard, y=y_vec), "start_x": [10] * 3, "solution_x": bard_solution_x, "start_criterion": 1306.234, "solution_criterion": 0.00821487730657897, }, "kowalik_osborne": { - "criterion": partial( + "fun": partial( kowalik_osborne, y1=v_vec, y2=y2_vec, @@ -889,245 +889,245 @@ def get_start_points_mancino(n, a=1): "solution_criterion": 0.00030750560384924, }, "meyer": { - "criterion": partial(meyer, y=y3_vec), + "fun": partial(meyer, y=y3_vec), "start_x": [0.02, 4000, 250], "solution_x": meyer_solution_x, "start_criterion": 1.693608e9, "solution_criterion": 87.945855170395831, }, "watson_6_good_start": { 
- "criterion": watson, + "fun": watson, "start_x": [0.5] * 6, "solution_x": watson_6_solution_x, "start_criterion": 16.43083, "solution_criterion": 0.00228767005355236, }, "watson_6_bad_start": { - "criterion": watson, + "fun": watson, "start_x": [5] * 6, "solution_x": watson_6_solution_x, "start_criterion": 2.323367e6, "solution_criterion": 0.00228767005355236, }, "watson_9_good_start": { - "criterion": watson, + "fun": watson, "start_x": [0.5] * 9, "solution_x": watson_9_solution_x, "start_criterion": 26.90417, "solution_criterion": 1.399760e-6, }, "watson_9_bad_start": { - "criterion": watson, + "fun": watson, "start_x": [5] * 9, "solution_x": watson_9_solution_x, "start_criterion": 8.158877e6, "solution_criterion": 1.399760e-6, }, "watson_12_good_start": { - "criterion": watson, + "fun": watson, "start_x": [0.5] * 12, "solution_x": watson_12_solution_x, "start_criterion": 73.67821, "solution_criterion": 4.722381e-10, }, "watson_12_bad_start": { - "criterion": watson, + "fun": watson, "start_x": [5] * 12, "solution_x": watson_12_solution_x, "start_criterion": 2.059384e7, "solution_criterion": 4.722381e-10, }, "box_3d": { - "criterion": partial(box_3d, dim_out=10), + "fun": partial(box_3d, dim_out=10), "start_x": [0, 10, 20], "solution_x": [1, 10, 1], "start_criterion": 1031.154, "solution_criterion": 0, }, "jennrich_sampson": { - "criterion": partial(jennrich_sampson, dim_out=10), + "fun": partial(jennrich_sampson, dim_out=10), "start_x": [0.3, 0.4], "solution_x": [0.2578252135686162] * 2, "start_criterion": 4171.306, "solution_criterion": 124.3621823556148, }, "brown_dennis_good_start": { - "criterion": partial(brown_dennis, dim_out=20), + "fun": partial(brown_dennis, dim_out=20), "start_x": [25, 5, -5, -1], "solution_x": brown_dennis_solution_x, "start_criterion": 7.926693e6, "solution_criterion": 85822.20162635, }, "brown_dennis_bad_start": { - "criterion": partial(brown_dennis, dim_out=20), + "fun": partial(brown_dennis, dim_out=20), "start_x": [250, 50, 
-50, -10], "solution_x": brown_dennis_solution_x, "start_criterion": 3.081064e11, "solution_criterion": 85822.20162635, }, "chebyquad_6": { - "criterion": partial(chebyquad, dim_out=6), + "fun": partial(chebyquad, dim_out=6), "start_x": [i / 7 for i in range(1, 7)], "solution_x": chebyquad_6_solution_x, "start_criterion": 4.642817e-2, "solution_criterion": 0, }, "chebyquad_7": { - "criterion": partial(chebyquad, dim_out=7), + "fun": partial(chebyquad, dim_out=7), "start_x": [i / 8 for i in range(1, 8)], "solution_x": chebyquad_7_solution_x, "start_criterion": 3.377064e-2, "solution_criterion": 0, }, "chebyquad_8": { - "criterion": partial(chebyquad, dim_out=8), + "fun": partial(chebyquad, dim_out=8), "start_x": [i / 9 for i in range(1, 9)], "solution_x": chebyquad_8_solution_x, "start_criterion": 3.861770e-2, "solution_criterion": 0.003516873725677, }, "chebyquad_9": { - "criterion": partial(chebyquad, dim_out=9), + "fun": partial(chebyquad, dim_out=9), "start_x": [i / 10 for i in range(1, 10)], "solution_x": chebyquad_9_solution_x, "start_criterion": 2.888298e-2, "solution_criterion": 0, }, "chebyquad_10": { - "criterion": partial(chebyquad, dim_out=10), + "fun": partial(chebyquad, dim_out=10), "start_x": [i / 11 for i in range(1, 11)], "solution_x": chebyquad_10_solution_x, "start_criterion": 3.376327e-2, "solution_criterion": 0.00477271369637536, }, "chebyquad_11": { - "criterion": partial(chebyquad, dim_out=11), + "fun": partial(chebyquad, dim_out=11), "start_x": [i / 12 for i in range(1, 12)], "solution_x": chebyquad_11_solution_x, "start_criterion": 2.674060e-2, "solution_criterion": 0.00279976155186576, }, "brown_almost_linear": { - "criterion": brown_almost_linear, + "fun": brown_almost_linear, "start_x": [0.5] * 10, "solution_x": [1] * 10, "start_criterion": 273.2480, "solution_criterion": 0, }, "osborne_one": { - "criterion": partial(osborne_one, y=y4_vec), + "fun": partial(osborne_one, y=y4_vec), "start_x": [0.5, 1.5, 1, 0.01, 0.02], "solution_x": 
osborne_one_solution_x, "start_criterion": 16.17411, "solution_criterion": 0.00005464894697483, }, "osborne_two_good_start": { - "criterion": partial(osborne_two, y=y5_vec), + "fun": partial(osborne_two, y=y5_vec), "start_x": [1.3, 0.65, 0.65, 0.7, 0.6, 3, 5, 7, 2, 4.5, 5.5], "solution_x": osborne_two_solution_x, "start_criterion": 2.093420, "solution_criterion": 0.0401377362935477, }, "osborne_two_bad_start": { - "criterion": partial(osborne_two, y=y5_vec), + "fun": partial(osborne_two, y=y5_vec), "start_x": [13, 6.5, 6.5, 7, 6, 30, 50, 70, 20, 45, 55], "solution_x": osborne_two_solution_x, "start_criterion": 199.6847, "solution_criterion": 0.0401377362935477, }, "bdqrtic_8": { - "criterion": bdqrtic, + "fun": bdqrtic, "start_x": [1] * 8, "solution_x": bdqrtic_8_solution_x, "start_criterion": 904, "solution_criterion": 10.2389734213174, }, "bdqrtic_10": { - "criterion": bdqrtic, + "fun": bdqrtic, "start_x": [1] * 10, "solution_x": bdqrtic_10_solution_x, "start_criterion": 1356, "solution_criterion": 18.28116175359353, }, "bdqrtic_11": { - "criterion": bdqrtic, + "fun": bdqrtic, "start_x": [1] * 11, "solution_x": bdqrtic_11_solution_x, "start_criterion": 1582, "solution_criterion": 22.260591734883817, }, "bdqrtic_12": { - "criterion": bdqrtic, + "fun": bdqrtic, "start_x": [1] * 12, "solution_x": bdqrtic_12_solution_x, "start_criterion": 1808, "solution_criterion": 26.2727663967939, }, "cube_5": { - "criterion": cube, + "fun": cube, "start_x": [0.5] * 5, "solution_x": [1] * 5, "start_criterion": 56.5, "solution_criterion": 0, }, "cube_6": { - "criterion": cube, + "fun": cube, "start_x": [0.5] * 6, "solution_x": [1] * 6, "start_criterion": 70.5625, "solution_criterion": 0, }, "cube_8": { - "criterion": cube, + "fun": cube, "start_x": [0.5] * 8, "solution_x": [1] * 8, "start_criterion": 98.6875, "solution_criterion": 0, }, "mancino_5_good_start": { - "criterion": mancino, + "fun": mancino, "start_x": get_start_points_mancino(5), "solution_x": mancino_5_solution_x, 
"start_criterion": 2.539084e9, "solution_criterion": 0, }, "mancino_5_bad_start": { - "criterion": mancino, + "fun": mancino, "start_x": get_start_points_mancino(5, 10), "solution_x": mancino_5_solution_x, "start_criterion": 6.873795e12, "solution_criterion": 0, }, "mancino_8": { - "criterion": mancino, + "fun": mancino, "start_x": get_start_points_mancino(8), "solution_x": mancino_8_solution_x, "start_criterion": 3.367961e9, "solution_criterion": 0, }, "mancino_10": { - "criterion": mancino, + "fun": mancino, "start_x": get_start_points_mancino(10), "solution_x": mancino_10_solution_x, "start_criterion": 3.735127e9, "solution_criterion": 0, }, "mancino_12_good_start": { - "criterion": mancino, + "fun": mancino, "start_x": get_start_points_mancino(12), "solution_x": mancino_12_solution_x, "start_criterion": 3.991072e9, "solution_criterion": 0, }, "mancino_12_bad_start": { - "criterion": mancino, + "fun": mancino, "start_x": get_start_points_mancino(12, 10), "solution_x": mancino_12_solution_x, "start_criterion": 1.130015e13, "solution_criterion": 0, }, "heart_eight_good_start": { - "criterion": partial( + "fun": partial( heart_eight, y=np.array([-0.69, -0.044, -1.57, -1.31, -2.65, 2, -12.6, 9.48]), ), @@ -1137,7 +1137,7 @@ def get_start_points_mancino(n, a=1): "solution_criterion": 0, }, "heart_eight_bad_start": { - "criterion": partial( + "fun": partial( heart_eight, y=np.array([-0.69, -0.044, -1.57, -1.31, -2.65, 2, -12.6, 9.48]), ), @@ -1147,7 +1147,7 @@ def get_start_points_mancino(n, a=1): "solution_criterion": 0, }, "brown_almost_linear_medium": { - "criterion": brown_almost_linear, + "fun": brown_almost_linear, "start_x": [0.5] * 100, "solution_x": [1] * 100, "start_criterion": 2.524757e5, diff --git a/src/optimagic/benchmarking/run_benchmark.py b/src/optimagic/benchmarking/run_benchmark.py index 128c02d0a..1a07ea273 100644 --- a/src/optimagic/benchmarking/run_benchmark.py +++ b/src/optimagic/benchmarking/run_benchmark.py @@ -181,7 +181,7 @@ def 
_process_one_result(optimize_result, problem): """ _registry = get_registry(extended=True) - _criterion = problem["noise_free_criterion"] + _criterion = problem["noise_free_fun"] _start_x = problem["inputs"]["params"] _start_crit_value = _criterion(_start_x) if isinstance(_start_crit_value, np.ndarray): diff --git a/tests/optimagic/benchmarking/test_cartis_roberts.py b/tests/optimagic/benchmarking/test_cartis_roberts.py index 6aac6fd5d..b5a5ab53b 100644 --- a/tests/optimagic/benchmarking/test_cartis_roberts.py +++ b/tests/optimagic/benchmarking/test_cartis_roberts.py @@ -10,7 +10,7 @@ @pytest.mark.parametrize("name, specification", list(CARTIS_ROBERTS_PROBLEMS.items())) def test_cartis_roberts_function_at_start_x(name, specification): # noqa: ARG001 - _criterion = specification["criterion"] + _criterion = specification["fun"] _x = np.array(specification["start_x"]) assert isinstance(specification["start_x"], list) _contributions = _criterion(_x) @@ -22,7 +22,7 @@ def test_cartis_roberts_function_at_start_x(name, specification): # noqa: ARG00 @pytest.mark.parametrize("name, specification", list(CARTIS_ROBERTS_PROBLEMS.items())) def test_cartis_roberts_function_at_solution_x(name, specification): # noqa: ARG001 - _criterion = specification["criterion"] + _criterion = specification["fun"] _x = specification["solution_x"] if _x is not None: assert isinstance(_x, list) diff --git a/tests/optimagic/benchmarking/test_get_benchmark_problems.py b/tests/optimagic/benchmarking/test_get_benchmark_problems.py index aa628a92b..d08fbdae0 100644 --- a/tests/optimagic/benchmarking/test_get_benchmark_problems.py +++ b/tests/optimagic/benchmarking/test_get_benchmark_problems.py @@ -26,7 +26,7 @@ def test_get_problems(name, additive_noise, multiplicative_noise, scaling): ) first_name = list(problems)[0] first = problems[first_name] - func = first["inputs"]["criterion"] + func = first["inputs"]["fun"] params = first["inputs"]["params"] first_eval = func(params)["value"] diff --git 
a/tests/optimagic/benchmarking/test_more_wild.py b/tests/optimagic/benchmarking/test_more_wild.py index 0e3b6c697..b7427cca0 100644 --- a/tests/optimagic/benchmarking/test_more_wild.py +++ b/tests/optimagic/benchmarking/test_more_wild.py @@ -8,7 +8,7 @@ @pytest.mark.parametrize("name, specification", list(MORE_WILD_PROBLEMS.items())) def test_more_wild_function_at_start_x(name, specification): # noqa: ARG001 - _criterion = specification["criterion"] + _criterion = specification["fun"] assert isinstance(specification["start_x"], list) _x = np.array(specification["start_x"]) _contributions = _criterion(_x) diff --git a/tests/optimagic/benchmarking/test_run_benchmark.py b/tests/optimagic/benchmarking/test_run_benchmark.py index 9b0a1d3f0..aa32a293b 100644 --- a/tests/optimagic/benchmarking/test_run_benchmark.py +++ b/tests/optimagic/benchmarking/test_run_benchmark.py @@ -91,8 +91,8 @@ def get_benchmark_problems_custom(raw_problems, internal_criterion): "inputs": inputs, "solution": _create_problem_solution_custom(specification), "info": specification.get("info", {}), - "noise_free_criterion": partial( - internal_criterion, criterion=specification["criterion"] + "noise_free_fun": partial( + internal_criterion, criterion=specification["fun"] ), "noisy": False, } @@ -103,11 +103,11 @@ def get_benchmark_problems_custom(raw_problems, internal_criterion): def _create_problem_inputs_custom(specification, internal_criterion_func): _criterion = partial( internal_criterion_func, - criterion=specification["criterion"], + criterion=specification["fun"], ) _params = specification["start_x"] - inputs = {"criterion": _criterion, "params": _params} + inputs = {"fun": _criterion, "params": _params} return inputs @@ -155,14 +155,14 @@ def _internal_criterion_dict(params, criterion): problems_pandas_input = { "linear_full_rank_good_start": { - "criterion": partial(linear_full_rank, dim_out=45), + "fun": partial(linear_full_rank, dim_out=45), "start_x": pd.DataFrame(np.ones(9), 
columns=["value"]), "solution_x": pd.DataFrame(linear_full_rank_solution_x, columns=["value"]), "start_criterion": 72, "solution_criterion": 36, }, "rosenbrock_good_start": { - "criterion": rosenbrock, + "fun": rosenbrock, "start_x": pd.DataFrame([-1.2, 1], columns=["value"]), "solution_x": pd.DataFrame(np.ones(2), columns=["value"]), "start_criterion": 24.2, @@ -173,7 +173,7 @@ def _internal_criterion_dict(params, criterion): prolems_dict_input = { "linear_full_rank_good_start": { - "criterion": partial(linear_full_rank, dim_out=45), + "fun": partial(linear_full_rank, dim_out=45), "start_x": {"a": 1, "b": np.ones((2, 2, 2))}, "solution_x": { "a": linear_full_rank_solution_x[0], @@ -183,7 +183,7 @@ def _internal_criterion_dict(params, criterion): "solution_criterion": 36, }, "rosenbrock_good_start": { - "criterion": rosenbrock, + "fun": rosenbrock, "start_x": {"a": np.array([-1.2, 1])}, "solution_x": {"a": np.ones(2)}, "start_criterion": 24.2, diff --git a/tests/optimagic/optimization/test_multistart.py b/tests/optimagic/optimization/test_multistart.py index 5d1be2209..75baac237 100644 --- a/tests/optimagic/optimization/test_multistart.py +++ b/tests/optimagic/optimization/test_multistart.py @@ -222,7 +222,7 @@ def ackley(x): dim = 5 kwargs = { - "criterion": ackley, + "fun": ackley, "params": np.full(dim, -10), "lower_bounds": np.full(dim, -32), "upper_bounds": np.full(dim, 32), From d781907b3e78b021cd317bdb870ed7835fa85584 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 14:19:54 +0200 Subject: [PATCH 07/25] Add tests for deprecations. 
--- tests/test_deprecations.py | 67 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 67 insertions(+) diff --git a/tests/test_deprecations.py b/tests/test_deprecations.py index be1d7d465..6a2998126 100644 --- a/tests/test_deprecations.py +++ b/tests/test_deprecations.py @@ -275,3 +275,70 @@ def test_estimagic_params_plot_is_deprecated(): res = om.minimize(lambda x: x @ x, np.arange(3), algorithm="scipy_lbfgsb") with pytest.warns(FutureWarning, match=msg): params_plot(res) + + +def test_criterion_is_depracated(): + msg = "the `criterion` argument has been renamed" + with pytest.warns(FutureWarning, match=msg): + om.minimize( + criterion=lambda x: x @ x, + params=np.arange(3), + algorithm="scipy_lbfgsb", + ) + + +def test_criterion_kwargs_is_deprecated(): + msg = "the `criterion_kwargs` argument has been renamed" + with pytest.warns(FutureWarning, match=msg): + om.minimize( + lambda x, a: x @ x, + params=np.arange(3), + algorithm="scipy_lbfgsb", + criterion_kwargs={"a": 1}, + ) + + +def test_derivative_is_deprecated(): + msg = "the `derivative` argument has been renamed" + with pytest.warns(FutureWarning, match=msg): + om.minimize( + lambda x: x @ x, + params=np.arange(3), + algorithm="scipy_lbfgsb", + derivative=lambda x: 2 * x, + ) + + +def test_derivative_kwargs_is_deprecated(): + msg = "the `derivative_kwargs` argument has been renamed" + with pytest.warns(FutureWarning, match=msg): + om.minimize( + lambda x: x @ x, + params=np.arange(3), + algorithm="scipy_lbfgsb", + jac=lambda x, a: 2 * x, + derivative_kwargs={"a": 1}, + ) + + +def test_criterion_and_derivative_is_deprecated(): + msg = "the `criterion_and_derivative` argument has been renamed" + with pytest.warns(FutureWarning, match=msg): + om.minimize( + lambda x: x @ x, + params=np.arange(3), + algorithm="scipy_lbfgsb", + criterion_and_derivative=lambda x: (x @ x, 2 * x), + ) + + +def test_criterion_and_derivative_kwargs_is_deprecated(): + msg = "the `criterion_and_derivative_kwargs` argument has been 
renamed" + with pytest.warns(FutureWarning, match=msg): + om.minimize( + lambda x: x @ x, + params=np.arange(3), + algorithm="scipy_lbfgsb", + fun_and_jac=lambda x, a: (x @ x, 2 * x), + criterion_and_derivative_kwargs={"a": 1}, + ) From 64cf934d3a947b3c1b044286aa5009eca2329aaa Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 14:46:56 +0200 Subject: [PATCH 08/25] Add x0 as alias for params. --- src/optimagic/exceptions.py | 4 ++ src/optimagic/optimization/optimize.py | 27 +++++++++++- .../optimization/test_scipy_aliases.py | 43 +++++++++++++++++++ 3 files changed, 73 insertions(+), 1 deletion(-) create mode 100644 tests/optimagic/optimization/test_scipy_aliases.py diff --git a/src/optimagic/exceptions.py b/src/optimagic/exceptions.py index 559a14532..6d63a7de0 100644 --- a/src/optimagic/exceptions.py +++ b/src/optimagic/exceptions.py @@ -27,6 +27,10 @@ class MissingInputError(OptimagicError): """Exception for missing user provided input.""" +class AliasError(OptimagicError): + """Exception for aliasing errors.""" + + class InvalidKwargsError(OptimagicError): """Exception for invalid user provided keyword arguments.""" diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index 1bf25b03b..2ccde1bae 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -7,6 +7,7 @@ InvalidFunctionError, InvalidKwargsError, MissingInputError, + AliasError, ) from optimagic.logging.create_tables import ( make_optimization_iteration_table, @@ -63,6 +64,8 @@ def maximize( multistart_options=None, collect_history=True, skip_checks=False, + # scipy aliases + x0=None, # deprecated arguments criterion=None, criterion_kwargs=None, @@ -99,6 +102,8 @@ def maximize( multistart_options=multistart_options, collect_history=collect_history, skip_checks=skip_checks, + # scipy aliases + x0=x0, # deprecated arguments criterion=criterion, criterion_kwargs=criterion_kwargs, @@ -136,6 +141,8 @@ def 
minimize( multistart_options=None, collect_history=True, skip_checks=False, + # scipy aliases + x0=None, # deprecated arguments criterion=None, criterion_kwargs=None, @@ -173,6 +180,8 @@ def minimize( multistart_options=multistart_options, collect_history=collect_history, skip_checks=skip_checks, + # scipy aliases + x0=x0, # deprecated arguments criterion=criterion, criterion_kwargs=criterion_kwargs, @@ -211,6 +220,8 @@ def _optimize( multistart_options, collect_history, skip_checks, + # scipy aliases + x0, # deprecated arguments criterion, criterion_kwargs, @@ -239,7 +250,7 @@ def _optimize( ) raise MissingInputError(msg) - if params is None: + if params is None and x0 is None: msg = ( "Missing start parameters. Please provide start parameters as the second " "positional argument or as the keyword argument `params`." @@ -328,6 +339,20 @@ def _optimize( if fun_and_jac_kwargs is None: fun_and_jac_kwargs = criterion_and_derivative_kwargs + # ================================================================================== + # handle scipy aliases + # ================================================================================== + + if x0 is not None: + if params is not None: + msg = ( + "x0 is an alias for params (for better compatibility with scipy). " + "Do not use both x0 and params." 
+ ) + raise AliasError(msg) + else: + params = x0 + # ================================================================================== # Set default values and check options # ================================================================================== diff --git a/tests/optimagic/optimization/test_scipy_aliases.py b/tests/optimagic/optimization/test_scipy_aliases.py new file mode 100644 index 000000000..ea035d117 --- /dev/null +++ b/tests/optimagic/optimization/test_scipy_aliases.py @@ -0,0 +1,43 @@ +import optimagic as om +import numpy as np +from numpy.testing import assert_array_almost_equal as aaae +from optimagic.exceptions import AliasError +import pytest + + +def test_x0_works_in_minimize(): + res = om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + ) + aaae(res.params, np.zeros(3)) + + +def test_x0_works_in_maximize(): + res = om.maximize( + fun=lambda x: -x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + ) + aaae(res.params, np.zeros(3)) + + +def test_x0_and_params_do_not_work_together_in_minimize(): + with pytest.raises(AliasError, match="x0 is an alias"): + om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + params=np.arange(3), + algorithm="scipy_lbfgsb", + ) + + +def test_x0_and_params_do_not_work_together_in_maximize(): + with pytest.raises(AliasError, match="x0 is an alias"): + om.maximize( + fun=lambda x: -x @ x, + x0=np.arange(3), + params=np.arange(3), + algorithm="scipy_lbfgsb", + ) From a5db76d92e75456e161df47401015ef0c061d709 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 15:09:40 +0200 Subject: [PATCH 09/25] Add method as partial alias for algorithm. 
--- src/optimagic/optimization/optimize.py | 18 ++++++- src/optimagic/optimization/scipy_aliases.py | 43 +++++++++++++++ .../optimization/test_scipy_aliases.py | 54 +++++++++++++++++++ 3 files changed, 114 insertions(+), 1 deletion(-) create mode 100644 src/optimagic/optimization/scipy_aliases.py diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index 2ccde1bae..d2ba64662 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -35,6 +35,7 @@ ) from optimagic.parameters.nonlinear_constraints import process_nonlinear_constraints from optimagic.shared.process_user_function import process_func_of_params +from optimagic.optimization.scipy_aliases import map_method_to_algorithm def maximize( @@ -66,6 +67,7 @@ def maximize( skip_checks=False, # scipy aliases x0=None, + method=None, # deprecated arguments criterion=None, criterion_kwargs=None, @@ -104,6 +106,7 @@ def maximize( skip_checks=skip_checks, # scipy aliases x0=x0, + method=method, # deprecated arguments criterion=criterion, criterion_kwargs=criterion_kwargs, @@ -143,6 +146,7 @@ def minimize( skip_checks=False, # scipy aliases x0=None, + method=None, # deprecated arguments criterion=None, criterion_kwargs=None, @@ -182,6 +186,7 @@ def minimize( skip_checks=skip_checks, # scipy aliases x0=x0, + method=method, # deprecated arguments criterion=criterion, criterion_kwargs=criterion_kwargs, @@ -222,6 +227,7 @@ def _optimize( skip_checks, # scipy aliases x0, + method, # deprecated arguments criterion, criterion_kwargs, @@ -257,7 +263,7 @@ def _optimize( ) raise MissingInputError(msg) - if algorithm is None: + if algorithm is None and method is None: msg = ( "Missing algorithm. Please provide an algorithm as the third positional " "argument or as the keyword argument `algorithm`." 
@@ -353,6 +359,16 @@ def _optimize( else: params = x0 + if method is not None: + if algorithm is not None: + msg = ( + "method is an alias for algorithm to select the scipy optimizers under " + "their original name. Do not use both method and algorithm." + ) + raise AliasError(msg) + else: + algorithm = map_method_to_algorithm(method) + # ================================================================================== # Set default values and check options # ================================================================================== diff --git a/src/optimagic/optimization/scipy_aliases.py b/src/optimagic/optimization/scipy_aliases.py new file mode 100644 index 000000000..434e6f5e6 --- /dev/null +++ b/src/optimagic/optimization/scipy_aliases.py @@ -0,0 +1,43 @@ +from optimagic.utilities import propose_alternatives + + +def map_method_to_algorithm(method): + implemented = { + "Nelder-Mead": "scipy_neldermead", + "Powell": "scipy_powell", + "CG": "scipy_conjugate_gradient", + "BFGS": "scipy_bfgs", + "Newton-CG": "scipy_newton_cg", + "L-BFGS-B": "scipy_lbfgsb", + "TNC": "scipy_truncated_newton", + "COBYLA": "scipy_cobyla", + "SLSQP": "scipy_slsqp", + "trust-constr": "scipy_trust_constr", + } + + not_implemented = { + "dogleg": "scipy_dogleg", + "trust-ncg": "scipy_trust_ncg", + "trust-exact": "scipy_trust_exact", + "trust-krylov": "scipy_trust_krylov", + "COBYQA": "scipy_cobyqa", + } + + if method in implemented: + algo = implemented[method] + elif method in not_implemented: + msg = ( + f"The method {method} is not yet wrapped in optimagic. Create an issue on " + "https://github.com/OpenSourceEconomics/optimagic/ if you have urgent need " + "for this method." + ) + raise NotImplementedError(msg) + else: + alt = propose_alternatives(method, list(implemented) + list(not_implemented)) + msg = ( + "method is an alias for algorithm to select the scipy optimizers under " + f"their original name. {method} is not a valid scipy algorithm name. 
" + f"Did you mean {alt}?" + ) + raise ValueError(msg) + return algo diff --git a/tests/optimagic/optimization/test_scipy_aliases.py b/tests/optimagic/optimization/test_scipy_aliases.py index ea035d117..99dea7f85 100644 --- a/tests/optimagic/optimization/test_scipy_aliases.py +++ b/tests/optimagic/optimization/test_scipy_aliases.py @@ -41,3 +41,57 @@ def test_x0_and_params_do_not_work_together_in_maximize(): params=np.arange(3), algorithm="scipy_lbfgsb", ) + + +METHODS = [ + "Nelder-Mead", + "Powell", + "CG", + "BFGS", + "Newton-CG", + "L-BFGS-B", + "TNC", + "COBYLA", + "SLSQP", + "trust-constr", +] + + +@pytest.mark.parametrize("method", METHODS) +def test_method_works_in_minimize(method): + res = om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + method="L-BFGS-B", + ) + aaae(res.params, np.zeros(3)) + + +@pytest.mark.parametrize("method", METHODS) +def test_method_works_in_maximize(method): + res = om.maximize( + fun=lambda x: -x @ x, + x0=np.arange(3), + method="L-BFGS-B", + ) + aaae(res.params, np.zeros(3)) + + +def test_method_and_algorithm_do_not_work_together_in_minimize(): + with pytest.raises(AliasError, match="method is an alias"): + om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + method="L-BFGS-B", + ) + + +def test_method_and_algorithm_do_not_work_together_in_maximize(): + with pytest.raises(AliasError, match="method is an alias"): + om.maximize( + fun=lambda x: -x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + method="L-BFGS-B", + ) From 8c34407b474181ff12531530d75bc893fb4b85d1 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Wed, 17 Jul 2024 15:32:36 +0200 Subject: [PATCH 10/25] Fix. 
--- pyproject.toml | 1 + 1 file changed, 1 insertion(+) diff --git a/pyproject.toml b/pyproject.toml index 357cf0460..396fe85be 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -161,6 +161,7 @@ module = [ "optimagic.optimization.process_multistart_sample", "optimagic.optimization.process_results", "optimagic.optimization.tiktak", + "optimagic.optimization.scipy_aliases", "optimagic.optimizers._pounders", "optimagic.optimizers._pounders.pounders_auxiliary", From f24100e08be53365d042125457e8ebe44305370c Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Thu, 18 Jul 2024 10:16:54 +0200 Subject: [PATCH 11/25] Add error handling for non-supported and not-yet supported scipy arguments. --- src/optimagic/optimization/optimize.py | 84 +++++++++++++++++++ .../optimization/test_scipy_aliases.py | 55 ++++++++++++ 2 files changed, 139 insertions(+) diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index d2ba64662..2cc45bc5c 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -68,6 +68,13 @@ def maximize( # scipy aliases x0=None, method=None, + # scipy arguments that are not yet supported + hess=None, + hessp=None, + callback=None, + # scipy arguments that will never be supported + options=None, + tol=None, # deprecated arguments criterion=None, criterion_kwargs=None, @@ -107,6 +114,13 @@ def maximize( # scipy aliases x0=x0, method=method, + # scipy arguments that are not yet supported + hess=hess, + hessp=hessp, + callback=callback, + # scipy arguments that will never be supported + options=options, + tol=tol, # deprecated arguments criterion=criterion, criterion_kwargs=criterion_kwargs, @@ -147,6 +161,13 @@ def minimize( # scipy aliases x0=None, method=None, + # scipy arguments that are not yet supported + hess=None, + hessp=None, + callback=None, + # scipy arguments that will never be supported + options=None, + tol=None, # deprecated arguments criterion=None, criterion_kwargs=None, 
@@ -187,6 +208,13 @@ def minimize( # scipy aliases x0=x0, method=method, + # scipy arguments that are not yet supported + hess=hess, + hessp=hessp, + callback=callback, + # scipy arguments that will never be supported + options=options, + tol=tol, # deprecated arguments criterion=criterion, criterion_kwargs=criterion_kwargs, @@ -228,6 +256,13 @@ def _optimize( # scipy aliases x0, method, + # scipy arguments that are not yet supported + hess, + hessp, + callback, + # scipy arguments that will never be supported + options, + tol, # deprecated arguments criterion, criterion_kwargs, @@ -369,6 +404,55 @@ def _optimize( else: algorithm = map_method_to_algorithm(method) + # ================================================================================== + # Handle scipy arguments that are not yet implemented + # ================================================================================== + + if hess is not None: + msg = ( + "The hess argument is not yet supported in optimagic. Creat an issue on " + "https://github.com/OpenSourceEconomics/optimagic/ if you have urgent need " + "for this feature." + ) + raise NotImplementedError(msg) + + if hessp is not None: + msg = ( + "The hessp argument is not yet supported in optimagic. Creat an issue on " + "https://github.com/OpenSourceEconomics/optimagic/ if you have urgent need " + "for this feature." + ) + raise NotImplementedError(msg) + + if callback is not None: + msg = ( + "The callback argument is not yet supported in optimagic. Creat an issue " + "on https://github.com/OpenSourceEconomics/optimagic/ if you have urgent " + "need for this feature." 
+ ) + raise NotImplementedError(msg) + + # ================================================================================== + # Handle scipy arguments that will never be supported + # ================================================================================== + + if options is not None: + # TODO: Add link to a how-to guide or tutorial for this + msg = ( + "The options argument is not supported in optimagic. Please use the " + "algo_options argument instead." + ) + raise NotImplementedError(msg) + + if tol is not None: + # TODO: Add link to a how-to guide or tutorial for this + msg = ( + "The tol argument is not supported in optimagic. Please use " + "algo_options or configured algorithms instead to set convergence criteria " + "for your optimizer." + ) + raise NotImplementedError(msg) + # ================================================================================== # Set default values and check options # ================================================================================== diff --git a/tests/optimagic/optimization/test_scipy_aliases.py b/tests/optimagic/optimization/test_scipy_aliases.py index 99dea7f85..86cdd0ed3 100644 --- a/tests/optimagic/optimization/test_scipy_aliases.py +++ b/tests/optimagic/optimization/test_scipy_aliases.py @@ -95,3 +95,58 @@ def test_method_and_algorithm_do_not_work_together_in_maximize(): algorithm="scipy_lbfgsb", method="L-BFGS-B", ) + + +def test_exception_for_hess(): + msg = "The hess argument is not yet supported" + with pytest.raises(NotImplementedError, match=msg): + om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + hess=lambda x: np.eye(len(x)), + ) + + +def test_exception_for_hessp(): + msg = "The hessp argument is not yet supported" + with pytest.raises(NotImplementedError, match=msg): + om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + hessp=lambda x, p: np.eye(len(x)) @ p, + ) + + +def test_exception_for_callback(): + msg = "The 
callback argument is not yet supported" + with pytest.raises(NotImplementedError, match=msg): + om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + callback=lambda x: print(x), + ) + + +def test_exception_for_options(): + msg = "The options argument is not supported" + with pytest.raises(NotImplementedError, match=msg): + om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + options={"maxiter": 100}, + ) + + +def test_exception_for_tol(): + msg = "The tol argument is not supported" + with pytest.raises(NotImplementedError, match=msg): + om.minimize( + fun=lambda x: x @ x, + x0=np.arange(3), + algorithm="scipy_lbfgsb", + tol=1e-6, + ) From 9ae006e35bc4f3b15b0b7319743938e167e3a44f Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Thu, 18 Jul 2024 10:47:10 +0200 Subject: [PATCH 12/25] Add support for args. --- src/optimagic/optimization/optimize.py | 27 +++++++++++++++- src/optimagic/shared/process_user_function.py | 17 ++++++++++ .../optimization/test_scipy_aliases.py | 31 +++++++++++++++++++ tests/optimagic/test_process_function.py | 15 ++++++++- 4 files changed, 88 insertions(+), 2 deletions(-) diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index 2cc45bc5c..20f6c5302 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -34,7 +34,10 @@ get_converter, ) from optimagic.parameters.nonlinear_constraints import process_nonlinear_constraints -from optimagic.shared.process_user_function import process_func_of_params +from optimagic.shared.process_user_function import ( + process_func_of_params, + get_kwargs_from_args, +) from optimagic.optimization.scipy_aliases import map_method_to_algorithm @@ -68,6 +71,7 @@ def maximize( # scipy aliases x0=None, method=None, + args=None, # scipy arguments that are not yet supported hess=None, hessp=None, @@ -114,6 +118,7 @@ def maximize( # scipy aliases x0=x0, method=method, + 
args=args, # scipy arguments that are not yet supported hess=hess, hessp=hessp, @@ -161,6 +166,7 @@ def minimize( # scipy aliases x0=None, method=None, + args=None, # scipy arguments that are not yet supported hess=None, hessp=None, @@ -208,6 +214,7 @@ def minimize( # scipy aliases x0=x0, method=method, + args=args, # scipy arguments that are not yet supported hess=hess, hessp=hessp, @@ -256,6 +263,7 @@ def _optimize( # scipy aliases x0, method, + args, # scipy arguments that are not yet supported hess, hessp, @@ -404,6 +412,23 @@ def _optimize( else: algorithm = map_method_to_algorithm(method) + if args is not None: + if ( + fun_kwargs is not None + or jac_kwargs is not None + or fun_and_jac_kwargs is not None + ): + msg = ( + "args is an alternative to fun_kwargs, jac_kwargs and " + "fun_and_jac_kwargs that optimagic supports for compatibility " + "with scipy. Do not use args in conjunction with any of the other " + "arguments." + ) + raise AliasError(msg) + else: + kwargs = get_kwargs_from_args(args, fun, offset=1) + fun_kwargs, jac_kwargs, fun_and_jac_kwargs = kwargs, kwargs, kwargs + # ================================================================================== # Handle scipy arguments that are not yet implemented # ================================================================================== diff --git a/src/optimagic/shared/process_user_function.py b/src/optimagic/shared/process_user_function.py index f53e7e57d..3a4471570 100644 --- a/src/optimagic/shared/process_user_function.py +++ b/src/optimagic/shared/process_user_function.py @@ -91,3 +91,20 @@ def get_arguments_without_default(func): no_default = set(no_default) return no_default + + +def get_kwargs_from_args(args, func, offset=0): + """Convert positional arguments to a dict of keyword arguments. + + Args: + args (list, tuple): Positional arguments. + func (callable): Function to be called. + offset (int, optional): Number of arguments to skip. Defaults to 0. 
+ + Returns: + dict: Keyword arguments. + + """ + names = list(inspect.signature(func).parameters)[offset:] + kwargs = {name: arg for name, arg in zip(names, args)} + return kwargs diff --git a/tests/optimagic/optimization/test_scipy_aliases.py b/tests/optimagic/optimization/test_scipy_aliases.py index 86cdd0ed3..022e7907f 100644 --- a/tests/optimagic/optimization/test_scipy_aliases.py +++ b/tests/optimagic/optimization/test_scipy_aliases.py @@ -150,3 +150,34 @@ def test_exception_for_tol(): algorithm="scipy_lbfgsb", tol=1e-6, ) + + +def test_args_works_in_minimize(): + res = om.minimize( + fun=lambda x, a: ((x - a) ** 2).sum(), + x0=np.arange(3), + args=(1,), + algorithm="scipy_lbfgsb", + ) + aaae(res.params, np.ones(3)) + + +def test_args_works_in_maximize(): + res = om.maximize( + fun=lambda x, a: -((x - a) ** 2).sum(), + x0=np.arange(3), + args=(1,), + algorithm="scipy_lbfgsb", + ) + aaae(res.params, np.ones(3)) + + +def test_args_does_not_work_with_together_with_any_kwargs(): + with pytest.raises(AliasError, match="args is an alternative"): + om.minimize( + fun=lambda x, a: ((x - a) ** 2).sum(), + params=np.arange(3), + algorithm="scipy_lbfgsb", + args=(1,), + fun_kwargs={"a": 1}, + ) diff --git a/tests/optimagic/test_process_function.py b/tests/optimagic/test_process_function.py index 6c4cfdff7..44d67defd 100644 --- a/tests/optimagic/test_process_function.py +++ b/tests/optimagic/test_process_function.py @@ -1,6 +1,9 @@ import pytest from optimagic.exceptions import InvalidKwargsError -from optimagic.shared.process_user_function import process_func_of_params +from optimagic.shared.process_user_function import ( + process_func_of_params, + get_kwargs_from_args, +) def test_process_func_of_params(): @@ -26,3 +29,13 @@ def f(params, b, c): with pytest.raises(InvalidKwargsError): process_func_of_params(f, {"c": 3}) + + +def test_get_kwargs_from_args(): + def f(a, b, c=3, d=4): + return a + b + c + + got = get_kwargs_from_args([1, 2], f, offset=1) + expected = 
{"b": 1, "c": 2} + + assert got == expected From fe5bbffd0a7bf65affb4b0022c807d459dd71eea Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Thu, 18 Jul 2024 10:49:38 +0200 Subject: [PATCH 13/25] Move test file. --- tests/optimagic/shared/__init__.py | 0 tests/optimagic/{ => shared}/test_process_function.py | 0 2 files changed, 0 insertions(+), 0 deletions(-) create mode 100644 tests/optimagic/shared/__init__.py rename tests/optimagic/{ => shared}/test_process_function.py (100%) diff --git a/tests/optimagic/shared/__init__.py b/tests/optimagic/shared/__init__.py new file mode 100644 index 000000000..e69de29bb diff --git a/tests/optimagic/test_process_function.py b/tests/optimagic/shared/test_process_function.py similarity index 100% rename from tests/optimagic/test_process_function.py rename to tests/optimagic/shared/test_process_function.py From 5e69049ab9bc3698b0beecdc5d93b2988dec3be2 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Thu, 18 Jul 2024 13:58:20 +0200 Subject: [PATCH 14/25] Restructure deprecation code. --- pyproject.toml | 1 + src/optimagic/deprecations.py | 60 +++++++++++++++++++++ src/optimagic/optimization/optimize.py | 74 ++++++-------------------- 3 files changed, 77 insertions(+), 58 deletions(-) create mode 100644 src/optimagic/deprecations.py diff --git a/pyproject.toml b/pyproject.toml index 396fe85be..4d211ac7e 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -224,6 +224,7 @@ module = [ "optimagic.decorators", "optimagic.exceptions", "optimagic.utilities", + "optimagic.deprecations", "estimagic", "estimagic.examples", diff --git a/src/optimagic/deprecations.py b/src/optimagic/deprecations.py new file mode 100644 index 000000000..f99644864 --- /dev/null +++ b/src/optimagic/deprecations.py @@ -0,0 +1,60 @@ +import warnings + + +def throw_criterion_future_warning(): + msg = ( + "To align optimagic with scipy.optimize, the `criterion` argument has been " + "renamed to `fun`. Please use `fun` instead of `criterion`. 
Using `criterion` " + " will become an error in optimagic version 0.6.0 and later." + ) + warnings.warn(msg, FutureWarning) + + +def throw_criterion_kwargs_future_warning(): + msg = ( + "To align optimagic with scipy.optimize, the `criterion_kwargs` argument has " + "been renamed to `fun_kwargs`. Please use `fun_kwargs` instead of " + "`criterion_kwargs`. Using `criterion_kwargs` will become an error in " + "optimagic version 0.6.0 and later." + ) + warnings.warn(msg, FutureWarning) + + +def throw_derivative_future_warning(): + msg = ( + "To align optimagic with scipy.optimize, the `derivative` argument has been " + "renamed to `jac`. Please use `jac` instead of `derivative`. Using `derivative`" + " will become an error in optimagic version 0.6.0 and later." + ) + warnings.warn(msg, FutureWarning) + + +def throw_derivative_kwargs_future_warning(): + msg = ( + "To align optimagic with scipy.optimize, the `derivative_kwargs` argument has " + "been renamed to `jac_kwargs`. Please use `jac_kwargs` instead of " + "`derivative_kwargs`. Using `derivative_kwargs` will become an error in " + "optimagic version 0.6.0 and later." + ) + warnings.warn(msg, FutureWarning) + + +def throw_criterion_and_derivative_future_warning(): + msg = ( + "To align optimagic with scipy.optimize, the `criterion_and_derivative` " + "argument has been renamed to `fun_and_jac`. Please use `fun_and_jac` " + "instead of `criterion_and_derivative`. Using `criterion_and_derivative` " + "will become an error in optimagic version 0.6.0 and later." + ) + warnings.warn(msg, FutureWarning) + + +def throw_criterion_and_derivative_kwargs_future_warning(): + msg = ( + "To align optimagic with scipy.optimize, the `criterion_and_derivative_kwargs` " + "argument has been renamed to `fun_and_jac_kwargs`. Please use " + "`fun_and_jac_kwargs` instead of `criterion_and_derivative_kwargs`. Using " + "`criterion_and_derivative_kwargs` will become an error in optimagic version " + "0.6.0 and later." 
+ ) + warnings.warn(msg, FutureWarning) diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index 20f6c5302..c0d06957c 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -39,6 +39,7 @@ get_kwargs_from_args, ) from optimagic.optimization.scipy_aliases import map_method_to_algorithm +from optimagic import deprecations def maximize( @@ -318,75 +319,32 @@ def _optimize( # ================================================================================== if criterion is not None: - msg = ( - "To align optimagic with scipy.optimize, the `criterion` argument has been " - "renamed to `fun`. Please use `fun` instead of `criterion`. Using " - "`criterion` will become an error in optimagic version 0.6.0 and later." - ) - warnings.warn(msg, FutureWarning) - - if fun is None: - fun = criterion + deprecations.throw_criterion_future_warning() + fun = criterion if fun is None else fun if criterion_kwargs is not None: - msg = ( - "To align optimagic with scipy.optimize, the `criterion_kwargs` argument " - "has been renamed to `fun_kwargs`. Please use `fun_kwargs` instead of " - "`criterion_kwargs`. Using `criterion_kwargs` will become an error in " - "optimagic version 0.6.0 and later." - ) - warnings.warn(msg, FutureWarning) - - if fun_kwargs is None: - fun_kwargs = criterion_kwargs + deprecations.throw_criterion_kwargs_future_warning() + fun_kwargs = criterion_kwargs if fun_kwargs is None else fun_kwargs if derivative is not None: - msg = ( - "To align optimagic with scipy.optimize, the `derivative` argument has " - "been renamed to `jac`. Please use `jac` instead of `derivative`. Using " - "`derivative` will become an error in optimagic version 0.6.0 and later." 
- ) - warnings.warn(msg, FutureWarning) - - if jac is None: - jac = derivative + deprecations.throw_derivative_future_warning() + jac = derivative if jac is None else jac if derivative_kwargs is not None: - msg = ( - "To align optimagic with scipy.optimize, the `derivative_kwargs` argument " - "has been renamed to `jac_kwargs`. Please use `jac_kwargs` instead of " - "`derivative_kwargs`. Using `derivative_kwargs` will become an error in " - "optimagic version 0.6.0 and later." - ) - warnings.warn(msg, FutureWarning) - - if jac_kwargs is None: - jac_kwargs = derivative_kwargs + deprecations.throw_derivative_kwargs_future_warning() + jac_kwargs = derivative_kwargs if jac_kwargs is None else jac_kwargs if criterion_and_derivative is not None: - msg = ( - "To align optimagic with scipy.optimize, the `criterion_and_derivative` " - "argument has been renamed to `fun_and_jac`. Please use `fun_and_jac` " - "instead of `criterion_and_derivative`. Using `criterion_and_derivative` " - "will become an error in optimagic version 0.6.0 and later." - ) - warnings.warn(msg, FutureWarning) - - if fun_and_jac is None: - fun_and_jac = criterion_and_derivative + deprecations.throw_criterion_and_derivative_future_warning() + fun_and_jac = criterion_and_derivative if fun_and_jac is None else fun_and_jac if criterion_and_derivative_kwargs is not None: - msg = ( - "To align optimagic with scipy.optimize, the " - "`criterion_and_derivative_kwargs` argument has been renamed to " - "`fun_and_jac_kwargs`. Please use `fun_and_jac_kwargs` instead of " - "`criterion_and_derivative_kwargs`. Using `criterion_and_derivative_kwargs`" - " will become an error in optimagic version 0.6.0 and later." 
+ deprecations.throw_criterion_and_derivative_kwargs_future_warning() + fun_and_jac_kwargs = ( + criterion_and_derivative_kwargs + if fun_and_jac_kwargs is None + else fun_and_jac_kwargs ) - warnings.warn(msg, FutureWarning) - - if fun_and_jac_kwargs is None: - fun_and_jac_kwargs = criterion_and_derivative_kwargs # ================================================================================== # handle scipy aliases From 5bc1bec14c81c21bb67281d91cbd6d36114d6926 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Thu, 18 Jul 2024 18:52:20 +0200 Subject: [PATCH 15/25] Basic renaming and deprecations for convergence and stopping criteria. --- docs/source/algorithms.md | 354 +++++++++--------- src/optimagic/benchmarking/run_benchmark.py | 12 +- src/optimagic/deprecations.py | 37 ++ src/optimagic/optimization/algo_options.py | 26 +- src/optimagic/optimization/optimize.py | 3 + src/optimagic/optimizers/bhhh.py | 16 +- src/optimagic/optimizers/fides.py | 36 +- src/optimagic/optimizers/ipopt.py | 18 +- src/optimagic/optimizers/nag_optimizers.py | 18 +- src/optimagic/optimizers/neldermead.py | 29 +- src/optimagic/optimizers/nlopt_optimizers.py | 340 ++++++++--------- src/optimagic/optimizers/pounders.py | 16 +- src/optimagic/optimizers/pygmo_optimizers.py | 66 ++-- src/optimagic/optimizers/scipy_optimizers.py | 202 +++++----- src/optimagic/optimizers/tao_optimizers.py | 62 +-- tests/estimagic/test_estimate_ml.py | 2 +- .../optimagic/optimization/test_multistart.py | 2 +- .../optimization/test_with_constraints.py | 4 +- tests/optimagic/optimizers/test_bhhh.py | 4 +- .../optimizers/test_fides_options.py | 12 +- .../optimizers/test_ipopt_options.py | 4 +- tests/optimagic/optimizers/test_neldermead.py | 2 +- 22 files changed, 639 insertions(+), 626 deletions(-) diff --git a/docs/source/algorithms.md b/docs/source/algorithms.md index 192070a90..c222a0566 100644 --- a/docs/source/algorithms.md +++ b/docs/source/algorithms.md @@ -43,7 +43,7 @@ install optimagic. 
The lbfgsb algorithm is almost perfectly scale invariant. Thus, it is not necessary to scale the parameters. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative improvement + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. More formally, this is expressed as .. math:: @@ -52,11 +52,11 @@ install optimagic. \text{relative_criterion_tolerance} - - **convergence.absolute_gradient_tolerance** (float): Stop if all elements of the projected + - **convergence.gtol_abs** (float): Stop if all elements of the projected gradient are smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - - **stopping.max_iterations** (int): If the maximum number of iterations is reached, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. - **limited_memory_storage_length** (int): Maximum number of saved gradients used to approximate the hessian matrix. @@ -82,9 +82,9 @@ install optimagic. .. note:: SLSQP's general nonlinear constraints are not supported yet by optimagic. - - **convergence.absolute_criterion_tolerance** (float): Precision goal for the value of + - **convergence.ftol_abs** (float): Precision goal for the value of f in the stopping criterion. - - **stopping.max_iterations** (int): If the maximum number of iterations is reached, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. ``` @@ -112,14 +112,14 @@ install optimagic. The argument `initial_simplex` is not supported by optimagic as it is not compatible with optimagic's handling of constraints. 
- - **stopping.max_iterations** (int): If the maximum number of iterations is reached, the optimization stops, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function evaluation is reached, + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - - **convergence.absolute_params_tolerance** (float): Absolute difference in parameters between iterations + - **convergence.xtol_abs** (float): Absolute difference in parameters between iterations that is tolerated to declare convergence. As no relative tolerances can be passed to Nelder-Mead, optimagic sets a non zero default for this. - - **convergence.absolute_criterion_tolerance** (float): Absolute difference in the criterion value between + - **convergence.ftol_abs** (float): Absolute difference in the criterion value between iterations that is tolerated to declare convergence. As no relative tolerances can be passed to Nelder-Mead, optimagic sets a non zero default for this. - **adaptive** (bool): Adapt algorithm parameters to dimensionality of problem. @@ -151,9 +151,9 @@ install optimagic. is part of the scipy interface is not supported by optimagic because it is incompatible with how optimagic handles constraints. - - **convergence.relative_params_tolerance (float)**: Stop when the relative movement between parameter + - **convergence.xtol_rel (float)**: Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative improvement between two + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. More formally, this is expressed as .. math:: @@ -161,9 +161,9 @@ install optimagic. 
\frac{(f^k - f^{k+1})}{\\max{{\{|f^k|, |f^{k+1}|, 1\}}}} \leq \text{relative_criterion_tolerance} - - **stopping.max_criterion_evaluations** (int): If the maximum number of function evaluation is reached, + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count thisas convergence. - - **stopping.max_iterations** (int): If the maximum number of iterations is reached, the optimization stops, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. ``` @@ -184,8 +184,8 @@ install optimagic. expansion near an optimum. However, BFGS can have acceptable performance even for non-smooth optimization instances. - - **convergence.absolute_gradient_tolerance** (float): Stop if all elements of the gradient are smaller than this. - - **stopping.max_iterations** (int): If the maximum number of iterations is reached, the optimization stops, + - **convergence.gtol_abs** (float): Stop if all elements of the gradient are smaller than this. + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. - **norm** (float): Order of the vector norm that is used to calculate the gradient's "score" that is compared to the gradient tolerance to determine convergence. Default is infinite which means that @@ -217,9 +217,9 @@ install optimagic. - the gradient is not too large, e.g., has a norm less than 1000. - The initial guess is reasonably close to the criterion's global minimizer. - - **convergence.absolute_gradient_tolerance** (float): Stop if all elements of the + - **convergence.gtol_abs** (float): Stop if all elements of the gradient are smaller than this. 
- - **stopping.max_iterations** (int): If the maximum number of iterations is reached, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. - **norm** (float): Order of the vector norm that is used to calculate the gradient's "score" that is compared to the gradient tolerance to determine convergence. @@ -266,10 +266,10 @@ install optimagic. - the gradient is not too large, e.g., has a norm less than 1000. - The initial guess is reasonably close to the criterion's global minimizer. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. Newton CG uses the average relative change in the parameters for determining the convergence. - - **stopping.max_iterations** (int): If the maximum number of iterations is reached, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. @@ -296,9 +296,9 @@ install optimagic. For more information on COBYLA see :cite:`Powell1994`, :cite:`Powell1998` and :cite:`Powell2007`. - - **stopping.max_iterations** (int): If the maximum number of iterations is reached, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. In case of COBYLA this is a lower bound on the size of the trust region and can be seen as the required accuracy in the variables but this accuracy is not guaranteed. @@ -344,20 +344,20 @@ install optimagic. ``messg_num`` which is an additional way to control the verbosity of the optimizer. 
- **func_min_estimate** (float): Minimum function value estimate. Defaults to 0. - stopping_max_iterations (int): If the maximum number of iterations is reached, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - - **convergence.absolute_params_tolerance** (float): Absolute difference in parameters + - **convergence.xtol_abs** (float): Absolute difference in parameters between iterations after scaling that is tolerated to declare convergence. - - **convergence.absolute_criterion_tolerance** (float): Absolute difference in the + - **convergence.ftol_abs** (float): Absolute difference in the criterion value between iterations after scaling that is tolerated to declare convergence. - - **convergence.absolute_gradient_tolerance** (float): Stop if the value of the + - **convergence.gtol_abs** (float): Stop if the value of the projected gradient (after applying x scaling factors) is smaller than this. - If convergence.absolute_gradient_tolerance < 0.0, - convergence.absolute_gradient_tolerance is set to + If convergence.gtol_abs < 0.0, + convergence.gtol_abs is set to 1e-2 * sqrt(accuracy). - **max_hess_evaluations_per_iteration** (int): Maximum number of hessian*vector evaluations per main iteration. If ``max_hess_evaluations == 0``, the @@ -415,19 +415,19 @@ install optimagic. It approximates the Hessian using the Broyden-Fletcher-Goldfarb-Shanno (BFGS) Hessian update strategy. - - **convergence.absolute_gradient_tolerance** (float): Tolerance for termination + - **convergence.gtol_abs** (float): Tolerance for termination by the norm of the Lagrangian gradient. 
The algorithm will terminate when both the infinity norm (i.e., max abs value) of the Lagrangian gradient and the constraint violation are smaller than the - convergence.absolute_gradient_tolerance. + convergence.gtol_abs. For this algorithm we use scipy's gradient tolerance for trust_constr. This smaller tolerance is needed for the sum of squares tests to pass. - - **stopping.max_iterations** (int): If the maximum number of iterations is reached, + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as convergence. - - **convergence.relative_params_tolerance** (float): Tolerance for termination by + - **convergence.xtol_rel** (float): Tolerance for termination by the change of the independent variable. The algorithm will terminate when the radius of the trust region used in the algorithm is smaller than the - convergence.relative_params_tolerance. + convergence.xtol_rel. - **trustregion.initial_radius** (float): Initial value of the trust region radius. The trust radius gives the maximum distance between solution points in consecutive iterations. It reflects the trust the algorithm puts in the @@ -453,11 +453,11 @@ install optimagic. The algorithm supports the following options: - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is below this. - - **convergence.relative_gradient_tolerance** (float): Stop when the gradient, + - **convergence.gtol_rel** (float): Stop when the gradient, divided by the absolute value of the criterion function is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. 
- **tr_solver** (str): Method for solving trust-region subproblems, relevant only @@ -495,11 +495,11 @@ install optimagic. The algorithm supports the following options: - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is below this. - - **convergence.relative_gradient_tolerance** (float): Stop when the gradient, + - **convergence.gtol_rel** (float): Stop when the gradient, divided by the absolute value of the criterion function is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - **tr_solver** (str): Method for solving trust-region subproblems, relevant only @@ -537,11 +537,11 @@ install optimagic. The algorithm supports the following options: - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is below this. - - **convergence.relative_gradient_tolerance** (float): Stop when the gradient, + - **convergence.gtol_rel** (float): Stop when the gradient, divided by the absolute value of the criterion function is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - **tr_solver** (str): Method for solving trust-region subproblems, relevant only @@ -675,13 +675,13 @@ install optimagic. 
- ‘rand2bin’ - ‘rand1bin’ - - **stopping.max_iterations** (int): The maximum number of criterion evaluations - without polishing is(stopping.max_iterations + 1) * population_size * number of + - **stopping.maxiter** (int): The maximum number of criterion evaluations + without polishing is (stopping.maxiter + 1) * population_size * number of parameters - **population_size_multiplier** (int): A multiplier setting the population size. The number of individuals in the population is population_size * number of parameters. The default 15. - - **convergence.relative_criterion_tolerance** (float): Default 0.01. + - **convergence.ftol_rel** (float): Default 0.01. - **mutation_constant** (float/tuple): The differential weight denoted by F in literature. Should be within 0 and 2. The tuple form is used to specify (min, max) dithering which can help speed convergence. Default is (0.5, 1). @@ -702,7 +702,7 @@ install optimagic. number of parameters). The initial population is clipped to bounds before use. Default is 'latinhypercube' - - **convergence.absolute_criterion_tolerance** (float): + - **convergence.ftol_abs** (float): CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE - **n_cores** (int): The number of cores on which the function is evaluated in parallel. Default 1. @@ -743,8 +743,8 @@ install optimagic. - **convergence.minimum_criterion_tolerance** (float): Specify the relative error between the current best minimum and the supplied global criterion_minimum allowed. Default is scipy's default, 1e-4. - - **stopping.max_iterations** (int): The maximum number of iterations. - - **stopping.max_criterion_evaluations** (int): The maximum number of criterion + - **stopping.maxiter** (int): The maximum number of iterations. + - **stopping.maxfun** (int): The maximum number of criterion evaluations. - **stopping.max_processing_time** (int): The maximum time allowed for the optimization. @@ -771,7 +771,7 @@ install optimagic. 
The algorithm supports the following options: - - **stopping.max_iterations** (int): Specify the maximum number of global searh + - **stopping.maxiter** (int): Specify the maximum number of global search iterations. - **local_algorithm** (str): The local optimization algorithm to be used. valid options are: "Nelder-Mead", "Powell", "CG", "BFGS", "Newton-CG", "L-BFGS-B", @@ -784,7 +784,7 @@ install optimagic. - **restart_temperature_ratio** (float): Reanneling starts when the algorithm is decreased to initial_temperature * restart_temperature_ratio. Default is 2e-05. - **visit** (float): Specify the thickness of visiting distribution's tails. Range is (1, 3] and default is scipy's default, 2.62. - **accept** (float): Controls the probability of acceptance. Range is (-1e4, -5] and default is scipy's default, -5.0. Smaller values lead to lower acceptance probability. - - **stopping.max_criterion_evaluations** (int): soft limit for the number of criterion evaluations. + - **stopping.maxfun** (int): soft limit for the number of criterion evaluations. - **seed** (int, None or RNG): Dual annealing is a stochastic process. Seed or random number generator. Default None. - **no_local_search** (bool): Specify whether to apply a traditional Generalized Simulated Annealing with no local search. Default is False. @@ -803,8 +803,8 @@ install optimagic. The algorithm supports the following options: - **eps** (float): Specify the minimum difference of the criterion values between the current best hyperrectangle and the next potentially best hyperrectangle to be divided determining the trade off between global and local search. Default is 1e-6 differing from scipy's default 1e-4. - - **stopping_max_criterion_evaluations** (int/None): Maximum number of criterion evaluations allowed. Default is None which caps the number of evaluations at 1000 * number of dimentions automatically. - - **stopping_max_iterations** (int): Maximum number of iterations allowed. 
+ - **stopping.maxfun** (int/None): Maximum number of criterion evaluations allowed. Default is None which caps the number of evaluations at 1000 * number of dimensions automatically. + - **stopping.maxiter** (int): Maximum number of iterations allowed. - **locally_biased** (bool): Determine whether to use the locally biased variant of the algorithm DIRECT_L. Default is True. - **convergence.minimum_criterion_value** (float): Specify the global minimum when it is known. Default is minus infinity. For maximization problems, flip the sign. - **convergence.minimum_criterion_tolerance** (float): Specify the relative error between the current best minimum and the supplied global criterion_minimum allowed. Default is scipy's default, 1e-4. @@ -841,9 +841,9 @@ We implement a few algorithms from scratch. They are currently considered experi bhhh supports the following options: - - **convergence_absolute_gradient_tolerance** (float): Stopping criterion for the + - **convergence.gtol_abs** (float): Stopping criterion for the gradient tolerance. Default is 1e-8. - - **stopping_max_iterations** (int): Maximum number of iterations. + - **stopping.maxiter** (int): Maximum number of iterations. If reached, terminate. Default is 200. ``` @@ -874,14 +874,14 @@ We implement a few algorithms from scratch. They are currently considered experi - **adaptive** (bool): Adjust parameters of Nelder-Mead algorithm to account for simplex size. The default is True. - - **stopping.max_iterations** (int): Maximum number of algorithm iterations. + - **stopping.maxiter** (int): Maximum number of algorithm iterations. The default is STOPPING_MAX_ITERATIONS. - - **convergence.absolute_criterion_tolerance** (float): maximal difference between + - **convergence.ftol_abs** (float): maximal difference between function value evaluated on simplex points. The default is CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE. 
- - **convergence.absolute_params_tolerance** (float): maximal distance between points + - **convergence.xtol_abs** (float): maximal distance between points in the simplex. The default is CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE. - **batch_evaluator** (string or callable): See :ref:`batch_evaluators` for @@ -921,19 +921,19 @@ We implement a few algorithms from scratch. They are currently considered experi pounders supports the following options: - - **convergence_absolute_gradient_tolerance**: Convergence tolerance for the + - **convergence.gtol_abs**: Convergence tolerance for the absolute gradient norm. Stop if norm of the gradient is less than this. Default is 1e-8. - - **convergence_relative_gradient_tolerance**: Convergence tolerance for the + - **convergence.gtol_rel**: Convergence tolerance for the relative gradient norm. Stop if norm of the gradient relative to the criterion value is less than this. Default is 1-8. - - **convergence_scaled_gradient_tolerance**: Convergence tolerance for the + - **convergence.gtol_scaled**: Convergence tolerance for the scaled gradient norm. Stop if norm of the gradient divided by norm of the gradient at the initial parameters is less than this. Disabled, i.e. set to False, by default. - **max_interpolation_points** (int): Maximum number of interpolation points. Default is `2 * n + 1`, where `n` is the length of the parameter vector. - - **stopping_max_iterations** (int): Maximum number of iterations. + - **stopping.maxiter** (int): Maximum number of iterations. If reached, terminate. Default is 2000. - **trustregion_initial_radius (float)**: Delta, initial trust-region radius. 0.1 by default. @@ -1052,17 +1052,17 @@ need to have [petsc4py](https://pypi.org/project/petsc4py/) installed. \frac{||g(X)||}{||g(X0)||} < \epsilon - - **convergence.absolute_gradient_tolerance** (float): Stop if norm of gradient is less than this. - If set to False the algorithm will not consider convergence.absolute_gradient_tolerance. 
- - **convergence.relative_gradient_tolerance** (float): Stop if relative norm of gradient is less + - **convergence.gtol_abs** (float): Stop if norm of gradient is less than this. + If set to False the algorithm will not consider convergence.gtol_abs. + - **convergence.gtol_rel** (float): Stop if relative norm of gradient is less than this. If set to False the algorithm will not consider - convergence.relative_gradient_tolerance. + convergence.gtol_rel. - **convergence.scaled_gradient_tolerance** (float): Stop if scaled norm of gradient is smaller than this. If set to False the algorithm will not consider convergence.scaled_gradient_tolerance. - **trustregion.initial_radius** (float): Initial value of the trust region radius. It must be :math:`> 0`. - - **stopping.max_iterations** (int): Alternative Stopping criterion. + - **stopping.maxiter** (int): Alternative Stopping criterion. If set the routine will stop after the number of specified iterations or after the step size is sufficiently small. If the variable is set the default criteria will all be ignored. @@ -1136,7 +1136,7 @@ install each of them separately: 3. when a sufficient reduction to the criterion value at the start parameters has been reached, i.e. when :math:`\frac{f(x)}{f(x_0)} \leq - \text{convergence.scaled_criterion_tolerance}` + \text{convergence.ftol_scaled}` 4. when all evaluations on the interpolation points fall within a scaled version of the noise level of the criterion function. This is only applicable if the @@ -1161,11 +1161,11 @@ install each of them separately: .. warning:: Very small values, as in most other tolerances don't make sense here. - - **convergence.scaled_criterion_tolerance** (float): + - **convergence.ftol_scaled** (float): Terminate if a point is reached where the ratio of the criterion value to the criterion value at the start params is below this value, i.e. if :math:`f(x_k)/f(x_0) \leq - \text{convergence.scaled_criterion_tolerance}`. 
Note this is + \text{convergence.ftol_scaled}`. Note this is deactivated unless the lowest mathematically possible criterion value (0.0) is actually achieved. - **convergence.slow_progress** (dict): Arguments for converging when the evaluations @@ -1193,7 +1193,7 @@ install each of them separately: Default is no averaging (i.e. ``noise_n_evals_per_point(...) = 1``). - **random_directions_orthogonal** (bool): see :ref:`algo_options`. - - **stopping.max_criterion_evaluations** (int): see :ref:`algo_options`. + - **stopping.maxfun** (int): see :ref:`algo_options`. - **threshold_for_safety_step** (float): see :ref:`algo_options`. - **trustregion.expansion_factor_successful** (float): see :ref:`algo_options`. - **trustregion.expansion_factor_very_successful** (float): see :ref:`algo_options`. @@ -1310,7 +1310,7 @@ install each of them separately: - **seek_global_optimum** (bool): whether to apply the heuristic to escape local minima presented in :cite:`Cartis2018a`. Only applies for noisy criterion functions. - - **stopping.max_criterion_evaluations** (int): see :ref:`algo_options`. + - **stopping.maxfun** (int): see :ref:`algo_options`. - **threshold_for_safety_step** (float): see :ref:`algo_options`. - **trustregion.expansion_factor_successful** (float): see :ref:`algo_options`. - **trustregion.expansion_factor_very_successful** (float): see :ref:`algo_options`. @@ -1387,7 +1387,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **kernel_size** (int): Number of solutions stored in the solution archive. - **speed_parameter_q** (float): This parameter manages the convergence speed towards the found minima (the smaller the faster). 
In the pygmo @@ -1399,7 +1399,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. function's values distances. - **threshold** (int): when the iteration counter reaches the threshold the convergence speed is set to 0.01 automatically. To deactivate this effect - set the threshold to stopping.max_iterations which is the largest allowed + set the threshold to stopping.maxiter which is the largest allowed value. - **speed_of_std_values_convergence** (int): parameter that determines the convergence speed of the standard deviations. This must be an integer @@ -1407,7 +1407,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **stopping.max_n_without_improvements** (int): if a positive integer is assigned here, the algorithm will count the runs without improvements, if this number exceeds the given value, the algorithm will be stopped. - - **stopping.max_criterion_evaluations** (int): maximum number of function + - **stopping.maxfun** (int): maximum number of function evaluations. - **focus** (float): this parameter makes the search for the optimum greedier and more focused on local improvements (the higher the greedier). If the @@ -1431,7 +1431,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. in :cite:`Mernik2015`. The algorithm is only suited for bounded parameter spaces. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **seed** (int): seed used by the internal random number generator. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function @@ -1463,7 +1463,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. 
- - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **weight_coefficient** (float): Weight coefficient. It is denoted by $F$ in the main paper and must lie in [0, 2]. It controls the amplification of the differential variation $(x_{r_2, G} - x_{r_3, G})$. @@ -1484,7 +1484,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **convergence.criterion_tolerance**: stopping criteria on the criterion tolerance. Default is 1e-6. It is not clear whether this is the absolute or relative criterion tolerance. - - **convergence.relative_params_tolerance**: stopping criteria on the x + - **convergence.xtol_rel**: stopping criteria on the x tolerance. In pygmo the default is 1e-6 but we use our default value of 1e-5. ``` @@ -1513,7 +1513,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): number of generations to consider. Each generation + - **stopping.maxiter** (int): number of generations to consider. Each generation will compute the objective function once. ``` @@ -1538,7 +1538,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **crossover_probability** (float): Crossover probability. - **crossover_strategy** (str): the crossover strategy. 
One of “exponential”,“binomial”, “single” or “sbx”. Default is "exponential". @@ -1587,7 +1587,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. cannot be done in parallel with other evaluations. Default False. - jde (bool): Whether to use the jDE self-adaptation variant to control the $F$ and $CR$ parameter. If True jDE is used, else iDE. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **mutation_variant** (int or str): code for the mutation variant to create a new candidate individual. The default is "rand/1/exp". The first ten are the classical mutation variants introduced in the orginal DE algorithm, the remaining @@ -1644,7 +1644,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **backward_horizon** (float): backward time horizon for the evolution path. It must lie betwen 0 and 1. - **variance_loss_compensation** (float): makes partly up for the small variance loss in @@ -1730,7 +1730,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **omega** (float): depending on the variant chosen, :math:`\omega` is the particles' inertia weight or the construction coefficient. It must lie between 0 and 1. 
@@ -1802,7 +1802,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **omega** (float): depending on the variant chosen, :math:`\omega` is the particles' inertia weight or the constructuion coefficient. It must lie between 0 and 1. @@ -1907,7 +1907,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **learning_rate_mean_update** (float): learning rate for the mean update (:math:`\eta_\mu`). It must be between 0 and 1 or None. @@ -1952,7 +1952,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. ``` @@ -1975,7 +1975,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. 
This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_criterion_evaluations** (int): maximum number of function evaluations. + - **stopping.maxfun** (int): maximum number of function evaluations. - **start_range** (float): the start range. Must be in (0, 1]. - **stop_range** (float): the stop range. Must be in (0, start_range]. - **reduction_coeff** (float): the range reduction coefficient. Must be in (0, 1). @@ -1999,7 +1999,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. - **discard_start_params** (bool): If True, the start params are not guaranteed to be part of the initial population. This saves one criterion function evaluation that cannot be done in parallel with other evaluations. Default False. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **choose_from_memory_probability** (float): probability of choosing from memory (similar to a crossover probability). - **min_pitch_adjustment_rate** (float): minimum pitch adjustment rate. (similar to a @@ -2032,7 +2032,7 @@ supports the following [pygmo2](https://esa.github.io/pygmo2) optimizers. cannot be done in parallel with other evaluations. Default False. - **jde** (bool): Whether to use the jDE self-adaptation variant to control the $F$ and $CR$ parameter. If True jDE is used, else iDE. - - **stopping.max_iterations** (int): Number of generations to evolve. + - **stopping.maxiter** (int): Number of generations to evolve. - **allowed_variants** (array-like object): allowed mutation variants (can be codes or strings). Each code refers to one mutation variant to create a new candidate individual. The first ten refer to the classical mutation variants introduced in @@ -2117,7 +2117,7 @@ To use ipopt, you need to have - print options. 
- - **convergence.relative_criterion_tolerance** (float): The algorithm + - **convergence.ftol_rel** (float): The algorithm terminates successfully, if the (scaled) non linear programming error becomes smaller than this value. @@ -2133,7 +2133,7 @@ To use ipopt, you need to have - **s_max** (float): Scaling threshold for the NLP error. - - **stopping.max_iterations** (int): If the maximum number of iterations is + - **stopping.maxiter** (int): If the maximum number of iterations is reached, the optimization stops, but we do not count this as successful convergence. The difference to ``max_criterion_evaluations`` is that one iteration might need several criterion evaluations, for example in a line @@ -3315,28 +3315,28 @@ need to have [the fides package](https://github.com/fides-dev/fides) installed - **sr1**: Symmetric Rank 1 update strategy as described in :cite:`Nocedal1999`, Chapter 6.2. - - **convergence.absolute_criterion_tolerance** (float): absolute convergence criterion + - **convergence.ftol_abs** (float): absolute convergence criterion tolerance. This is only the interpretation of this parameter if the relative criterion tolerance is set to 0. Denoting the absolute criterion tolerance by :math:`\alpha` and the relative criterion tolerance by :math:`\beta`, the convergence condition on the criterion improvement is :math:`|f(x_k) - f(x_{k-1})| < \alpha + \beta \cdot |f(x_{k-1})|` - - **convergence.relative_criterion_tolerance** (float): relative convergence criterion + - **convergence.ftol_rel** (float): relative convergence criterion tolerance. This is only the interpretation of this parameter if the absolute criterion tolerance is set to 0 (as is the default). 
Denoting the absolute criterion tolerance by :math:`\alpha` and the relative criterion tolerance by :math:`\beta`, the convergence condition on the criterion improvement is :math:`|f(x_k) - f(x_{k-1})| < \alpha + \beta \cdot |f(x_{k-1})|` - - **convergence.absolute_params_tolerance** (float): The optimization terminates + - **convergence.xtol_abs** (float): The optimization terminates successfully when the step size falls below this number, i.e. when :math:`||x_{k+1} - x_k||` is smaller than this tolerance. - - **convergence.absolute_gradient_tolerance** (float): The optimization terminates + - **convergence.gtol_abs** (float): The optimization terminates successfully when the gradient norm is less or equal than this tolerance. - - **convergence.relative_gradient_tolerance** (float): The optimization terminates + - **convergence.gtol_rel** (float): The optimization terminates successfully when the norm of the gradient divided by the absolute function value is less or equal to this tolerance. - - **stopping.max_iterations** (int): maximum number of allowed iterations. + - **stopping.maxiter** (int): maximum number of allowed iterations. - **stopping.max_seconds** (int): maximum number of walltime seconds, deactivated by default. @@ -3409,15 +3409,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run For details see :cite:`Powell2009`. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. 
- - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3437,15 +3437,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run that the nlopt version supports bounds. This is done by moving all new points that would lie outside the bounds exactly on the bounds. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3481,15 +3481,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run In case of bounded constraints, this method is dominated by `nlopt_bobyqa` and `nlopt_cobyla`. 
- - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. @@ -3524,15 +3524,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run - Supports unequal initial-step sizes in the different parameters. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. 
- - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3556,15 +3556,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run of Rowan, is that it explicitly supports bound constraints providing big improvement in the case where the optimum lies against one of the constraints. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3591,15 +3591,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run `NEWUOA` requires the dimension n of the parameter space to be `≥ 2`, i.e. 
the implementation does not handle one-dimensional optimization problems. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3623,15 +3623,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run Detailed description of algorithms is given in :cite:`Dembo1983`. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. 
- - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3655,15 +3655,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run Detailed description of algorithms is given in :cite:`Nocedal1989`, :cite:`Nocedal1980`. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3687,15 +3687,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run The implementation is based on CCSA algorithm described in :cite:`Svanberg2002`. 
- - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3719,15 +3719,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run verge to a local optimum from any feasible starting point. - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. 
- - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3748,15 +3748,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run Detailed explanation of the algorithm, including its two variations of rank-2 and rank-1 methods can be found in the following paper :cite:`Vlcek2006` . - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - **rank_1_update** (bool): Whether I rank-1 or rank-2 update is used. @@ -3778,15 +3778,15 @@ addition to optimagic when using an NLOPT algorithm. 
To install nlopt run The implementation is based on the procedure described in :cite:`Kraft1988` and :cite:`Kraft1994` . - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3823,15 +3823,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run - "DIRECT_L_RAND_NOSCAL" - "DIRECT_RAND" - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. 
- - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - **locally_biased** (bool): Whether the "L" version of the algorithm is selected. @@ -3854,15 +3854,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run More information on this method can be found in :cite:`DaSilva2010` , :cite:`DaSilva2010a` , :cite:`Beyer2002` and :cite:`Vent1975` . - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3885,15 +3885,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run :cite:`PhilipRunarsson2005` and :cite:`Thomas2000` . 
- - **convergence.relative_params_tolerance** (float): Stop when the relative + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. - - **convergence.absolute_criterion_tolerance** (float): Stop when the change of + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. ``` @@ -3917,15 +3917,15 @@ addition to optimagic when using an NLOPT algorithm. To install nlopt run meter population_size. If the user doesn't specify a value, it is set to the nlopt default of 10*(n+1). - - **convergence.relative_params_tolerance** (float): Stop when the relative movement + - **convergence.xtol_rel** (float): Stop when the relative movement between parameter vectors is smaller than this. - - **convergence.absolute_params_tolerance** (float): Stop when the absolute movement + - **convergence.xtol_abs** (float): Stop when the absolute movement between parameter vectors is smaller than this. - - **convergence.relative_criterion_tolerance** (float): Stop when the relative + - **convergence.ftol_rel** (float): Stop when the relative improvement between two iterations is smaller than this. 
- - **convergence.absolute_criterion_tolerance** (float): Stop when the change of the + - **convergence.ftol_abs** (float): Stop when the change of the criterion function between two iterations is smaller than this. - - **stopping.max_criterion_evaluations** (int): If the maximum number of function + - **stopping.maxfun** (int): If the maximum number of function evaluation is reached, the optimization stops but we do not count this as convergence. - **population_size** (int): Size of the population. If None, it's set to be diff --git a/src/optimagic/benchmarking/run_benchmark.py b/src/optimagic/benchmarking/run_benchmark.py index 1a07ea273..06cfccabd 100644 --- a/src/optimagic/benchmarking/run_benchmark.py +++ b/src/optimagic/benchmarking/run_benchmark.py @@ -39,7 +39,7 @@ def run_benchmark( dictionary that maps a name for optimizer settings (e.g. ``"lbfgsb_strict_criterion"``) to a dictionary of keyword arguments for arguments for ``minimize`` (e.g. ``{"algorithm": "scipy_lbfgsb", - "algo_options": {"convergence.relative_criterion_tolerance": 1e-12}}``). + "algo_options": {"convergence.ftol_rel": 1e-12}}``). Alternatively, the values can just be an algorithm which is then benchmarked at default settings. batch_evaluator (str or callable): See :ref:`batch_evaluators`. 
@@ -115,12 +115,12 @@ def _process_optimize_options(raw_options, max_evals, disable_convergence): default_algo_options = {} if max_evals is not None: - default_algo_options["stopping.max_criterion_evaluations"] = max_evals - default_algo_options["stopping.max_iterations"] = max_evals + default_algo_options["stopping.maxfun"] = max_evals + default_algo_options["stopping.maxiter"] = max_evals if disable_convergence: - default_algo_options["convergence.relative_criterion_tolerance"] = 1e-14 - default_algo_options["convergence.relative_params_tolerance"] = 1e-14 - default_algo_options["convergence.relative_gradient_tolerance"] = 1e-14 + default_algo_options["convergence.ftol_rel"] = 1e-14 + default_algo_options["convergence.xtol_rel"] = 1e-14 + default_algo_options["convergence.gtol_rel"] = 1e-14 out_options = {} for name, _option in dict_options.items(): diff --git a/src/optimagic/deprecations.py b/src/optimagic/deprecations.py index f99644864..1d5defe8e 100644 --- a/src/optimagic/deprecations.py +++ b/src/optimagic/deprecations.py @@ -58,3 +58,40 @@ def throw_criterion_and_derivative_kwargs_future_warning(): "0.6.0 and later." 
) warnings.warn(msg, FutureWarning) + + +def replace_and_warn_about_deprecated_algo_options(algo_options): + if not isinstance(algo_options, dict): + return algo_options + + algo_options = {k.replace(".", "_"): v for k, v in algo_options.items()} + + replacements = { + "stopping_max_criterion_evaluations": "stopping_maxfun", + "stopping_max_iterations": "stopping_maxiter", + "convergence_absolute_criterion_tolerance": "convergence_ftol_abs", + "convergence_relative_criterion_tolerance": "convergence_ftol_rel", + "convergence_scaled_criterion_tolerance": "convergence_ftol_scaled", + "convergence_absolute_params_tolerance": "convergence_xtol_abs", + "convergence_relative_params_tolerance": "convergence_xtol_rel", + "convergence_absolute_gradient_tolerance": "convergence_gtol_abs", + "convergence_relative_gradient_tolerance": "convergence_gtol_rel", + "convergence_scaled_gradient_tolerance": "convergence_gtol_scaled", + } + + present = sorted(set(algo_options) & set(replacements)) + if present: + msg = ( + "The following keys in `algo_options` are deprecated and will be removed " + "in optimagic version 0.6.0 and later. Please replace them as follows:\n" + ) + for k in present: + msg += f" {k} -> {replacements[k]}\n" + + warnings.warn(msg, FutureWarning) + + out = {k: v for k, v in algo_options.items() if k not in present} + for k in present: + out[replacements[k]] = algo_options[k] + + return out diff --git a/src/optimagic/optimization/algo_options.py b/src/optimagic/optimization/algo_options.py index 24d0cb9e4..5c854bc7e 100644 --- a/src/optimagic/optimization/algo_options.py +++ b/src/optimagic/optimization/algo_options.py @@ -14,7 +14,7 @@ ===================================================================================== """ -CONVERGENCE_RELATIVE_CRITERION_TOLERANCE = 2e-9 +CONVERGENCE_FTOL_REL = 2e-9 """float: Stop when the relative improvement between two iterations is below this. 
The exact definition of relative improvement depends on the optimizer and should @@ -24,14 +24,14 @@ """ -CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE = 0 +CONVERGENCE_FTOL_ABS = 0 """float: Stop when the absolute improvement between two iterations is below this. Disabled by default because it is very problem specific. """ -CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE = 1e-5 +CONVERGENCE_GTOL_ABS = 1e-5 """float: Stop when the gradient are smaller than this. For some algorithms this criterion refers to all entries, for others to some norm. @@ -43,7 +43,7 @@ """ -CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE = 1e-8 +CONVERGENCE_GTOL_REL = 1e-8 """float: Stop when the gradient, divided by the absolute value of the criterion function is smaller than this. For some algorithms this criterion refers to all entries, for others to some norm.For bound constrained optimizers this @@ -52,7 +52,7 @@ """ -CONVERGENCE_SCALED_GRADIENT_TOLERANCE = 1e-8 +CONVERGENCE_GTOL_SCALED = 1e-8 """float: Stop when all entries (or for some algorithms the norm) of the gradient, divided by the norm of the gradient at start parameters is smaller than this. For bound constrained optimizers this typically refers to a projected gradient. @@ -61,7 +61,7 @@ """ -CONVERGENCE_RELATIVE_PARAMS_TOLERANCE = 1e-5 +CONVERGENCE_XTOL_REL = 1e-5 """float: Stop when the relative change in parameters is smaller than this. The exact definition of relative change and whether this refers to the maximum change or the average change depends on the algorithm and should be documented @@ -69,7 +69,7 @@ """ -CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE = 0 +CONVERGENCE_XTOL_ABS = 0 """float: Stop when the absolute change in parameters between two iterations is smaller than this. Whether this refers to the maximum change or the average change depends on the algorithm and should be documented there. 
@@ -79,7 +79,7 @@ """ -CONVERGENCE_NOISE_CORRECTED_CRITERION_TOLERANCE = 1.0 +CONVERGENCE_NOISE_CORRECTED_FTOL = 1.0 """float: Stop when the evaluations on the set of interpolation points all fall within this factor of the noise level. The default is 1, i.e. when all evaluations are within the noise level. If you want to not use this criterion but still flag your @@ -94,7 +94,7 @@ """float: Stop when the lower trust region radius falls below this value.""" -STOPPING_MAX_CRITERION_EVALUATIONS = 1_000_000 +STOPPING_MAXFUN = 1_000_000 """int: If the maximum number of function evaluation is reached, the optimization stops but we do not count this as successful convergence. The function evaluations used @@ -103,7 +103,7 @@ """ -STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL = 1_000 +STOPPING_MAXFUN_GLOBAL = 1_000 """int: If the maximum number of function evaluation is reached, the optimization stops but we do not count this as successful convergence. The function evaluations used @@ -113,7 +113,7 @@ """ -STOPPING_MAX_ITERATIONS = 1_000_000 +STOPPING_MAXITER = 1_000_000 """int: If the maximum number of iterations is reached, the optimization stops, but we do not count this as successful convergence. @@ -123,14 +123,14 @@ """ -CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE = 1e-08 +CONVERGENCE_SECOND_BEST_FTOL_ABS = 1e-08 """float: absolute criterion tolerance optimagic requires if no other stopping criterion apart from max iterations etc. is available this is taken from scipy (SLSQP's value, smaller than Nelder-Mead). """ -CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE = 1e-08 +CONVERGENCE_SECOND_BEST_XTOL_ABS = 1e-08 """float: The absolute parameter tolerance optimagic requires if no other stopping criterion apart from max iterations etc. is available. This is taken from pybobyqa. 
diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index c0d06957c..4c9074d53 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -40,6 +40,7 @@ ) from optimagic.optimization.scipy_aliases import map_method_to_algorithm from optimagic import deprecations +from optimagic.deprecations import replace_and_warn_about_deprecated_algo_options def maximize( @@ -346,6 +347,8 @@ def _optimize( else fun_and_jac_kwargs ) + algo_options = replace_and_warn_about_deprecated_algo_options(algo_options) + # ================================================================================== # handle scipy aliases # ================================================================================== diff --git a/src/optimagic/optimizers/bhhh.py b/src/optimagic/optimizers/bhhh.py index df8cc0a8c..10927ee66 100644 --- a/src/optimagic/optimizers/bhhh.py +++ b/src/optimagic/optimizers/bhhh.py @@ -15,8 +15,8 @@ def bhhh( criterion_and_derivative, x, *, - convergence_absolute_gradient_tolerance=1e-8, - stopping_max_iterations=200, + convergence_gtol_abs=1e-8, + stopping_maxiter=200, ): """Minimize a likelihood function using the BHHH algorithm. @@ -27,8 +27,8 @@ def bhhh( result_dict = bhhh_internal( criterion_and_derivative, x=x, - convergence_absolute_gradient_tolerance=convergence_absolute_gradient_tolerance, - stopping_max_iterations=stopping_max_iterations, + convergence_gtol_abs=convergence_gtol_abs, + stopping_maxiter=stopping_maxiter, ) return result_dict @@ -37,8 +37,8 @@ def bhhh( def bhhh_internal( criterion_and_derivative, x, - convergence_absolute_gradient_tolerance, - stopping_max_iterations, + convergence_gtol_abs, + stopping_maxiter, ): """Minimize a likelihood function using the BHHH algorithm.
@@ -72,7 +72,7 @@ def bhhh_internal( step_size = initial_step_size niter = 1 - while niter < stopping_max_iterations: + while niter < stopping_maxiter: niter += 1 x_candidate = x_accepted + step_size * direction @@ -114,7 +114,7 @@ def bhhh_internal( # Reset stepsize step_size = initial_step_size - if gtol < convergence_absolute_gradient_tolerance: + if gtol < convergence_gtol_abs: break result_dict = { diff --git a/src/optimagic/optimizers/fides.py b/src/optimagic/optimizers/fides.py index feb292fbd..3ebd34642 100644 --- a/src/optimagic/optimizers/fides.py +++ b/src/optimagic/optimizers/fides.py @@ -8,12 +8,12 @@ from optimagic.decorators import mark_minimizer from optimagic.exceptions import NotInstalledError from optimagic.optimization.algo_options import ( - CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE, - STOPPING_MAX_ITERATIONS, + CONVERGENCE_FTOL_ABS, + CONVERGENCE_GTOL_ABS, + CONVERGENCE_XTOL_ABS, + CONVERGENCE_FTOL_REL, + CONVERGENCE_GTOL_REL, + STOPPING_MAXITER, ) if IS_FIDES_INSTALLED: @@ -33,12 +33,12 @@ def fides( upper_bounds, *, hessian_update_strategy="bfgs", - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_absolute_gradient_tolerance=CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - convergence_relative_gradient_tolerance=CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_gtol_abs=CONVERGENCE_GTOL_ABS, + convergence_gtol_rel=CONVERGENCE_GTOL_REL, + stopping_maxiter=STOPPING_MAXITER, 
stopping_max_seconds=np.inf, trustregion_initial_radius=1.0, trustregion_stepback_strategy="truncate", @@ -64,19 +64,19 @@ def fides( fides_options = { "delta_init": trustregion_initial_radius, "eta": trustregion_increase_threshold, - "fatol": convergence_absolute_criterion_tolerance, - "frtol": convergence_relative_criterion_tolerance, + "fatol": convergence_ftol_abs, + "frtol": convergence_ftol_rel, "gamma1": trustregion_decrease_factor, "gamma2": trustregion_increase_factor, - "gatol": convergence_absolute_gradient_tolerance, - "grtol": convergence_relative_gradient_tolerance, - "maxiter": stopping_max_iterations, + "gatol": convergence_gtol_abs, + "grtol": convergence_gtol_rel, + "maxiter": stopping_maxiter, "maxtime": stopping_max_seconds, "mu": trustregion_decrease_threshold, "stepback_strategy": trustregion_stepback_strategy, "subspace_solver": trustregion_subspace_dimension, "theta_max": trustregion_max_stepback_fraction, - "xtol": convergence_absolute_params_tolerance, + "xtol": convergence_xtol_abs, } hessian_instance = _create_hessian_updater_from_user_input(hessian_update_strategy) diff --git a/src/optimagic/optimizers/ipopt.py b/src/optimagic/optimizers/ipopt.py index ef24c33ce..f80f50733 100644 --- a/src/optimagic/optimizers/ipopt.py +++ b/src/optimagic/optimizers/ipopt.py @@ -6,8 +6,8 @@ from optimagic.decorators import mark_minimizer from optimagic.exceptions import NotInstalledError from optimagic.optimization.algo_options import ( - CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - STOPPING_MAX_ITERATIONS, + CONVERGENCE_FTOL_REL, + STOPPING_MAXITER, ) from optimagic.optimizers.scipy_optimizers import process_scipy_result @@ -31,14 +31,14 @@ def ipopt( # nonlinear constraints nonlinear_constraints=(), # convergence criteria - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, dual_inf_tol=1.0, constr_viol_tol=0.0001, compl_inf_tol=0.0001, s_max=100.0, mu_target=0.0, # stopping 
criteria - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + stopping_maxiter=STOPPING_MAXITER, stopping_max_wall_time_seconds=1e20, stopping_max_cpu_time=1e20, # acceptable heuristic @@ -225,7 +225,7 @@ def ipopt( "The 'ipopt' algorithm requires the cyipopt package to be installed. " "You can it with: `conda install -c conda-forge cyipopt`." ) - if acceptable_tol <= convergence_relative_criterion_tolerance: + if acceptable_tol <= convergence_ftol_rel: raise ValueError( "The acceptable tolerance must be larger than the desired tolerance." ) @@ -246,9 +246,7 @@ def ipopt( # The default value is actually 1e2*tol, where tol is the general # termination tolerance. if resto_failure_feasibility_threshold is None: - resto_failure_feasibility_threshold = ( - 1e2 * convergence_relative_criterion_tolerance - ) + resto_failure_feasibility_threshold = 1e2 * convergence_ftol_rel # convert None to str none section linear_solver_options_with_none = [ @@ -333,7 +331,7 @@ def ipopt( # disable derivative checker "derivative_test": "none", "s_max": float(s_max), - "max_iter": stopping_max_iterations, + "max_iter": stopping_maxiter, "max_wall_time": float(stopping_max_wall_time_seconds), "max_cpu_time": stopping_max_cpu_time, "dual_inf_tol": dual_inf_tol, @@ -498,7 +496,7 @@ def ipopt( bounds=_get_scipy_bounds(lower_bounds, upper_bounds), jac=derivative, constraints=nonlinear_constraints, - tol=convergence_relative_criterion_tolerance, + tol=convergence_ftol_rel, options=options, ) diff --git a/src/optimagic/optimizers/nag_optimizers.py b/src/optimagic/optimizers/nag_optimizers.py index ff869e24d..6dc35c6bf 100644 --- a/src/optimagic/optimizers/nag_optimizers.py +++ b/src/optimagic/optimizers/nag_optimizers.py @@ -18,13 +18,13 @@ from optimagic.optimization.algo_options import ( CLIP_CRITERION_IF_OVERFLOWING, CONVERGENCE_MINIMAL_TRUSTREGION_RADIUS_TOLERANCE, - CONVERGENCE_NOISE_CORRECTED_CRITERION_TOLERANCE, + CONVERGENCE_NOISE_CORRECTED_FTOL, CONVERGENCE_SLOW_PROGRESS, 
INITIAL_DIRECTIONS, INTERPOLATION_ROUNDING_ERROR, RANDOM_DIRECTIONS_ORTHOGONAL, RESET_OPTIONS, - STOPPING_MAX_CRITERION_EVALUATIONS, + STOPPING_MAXFUN, THRESHOLD_FOR_SAFETY_STEP, TRUSTREGION_EXPANSION_FACTOR_SUCCESSFUL, TRUSTREGION_EXPANSION_FACTOR_VERY_SUCCESSFUL, @@ -59,8 +59,8 @@ def nag_dfols( *, clip_criterion_if_overflowing=CLIP_CRITERION_IF_OVERFLOWING, convergence_minimal_trustregion_radius_tolerance=CONVERGENCE_MINIMAL_TRUSTREGION_RADIUS_TOLERANCE, # noqa: E501 - convergence_noise_corrected_criterion_tolerance=CONVERGENCE_NOISE_CORRECTED_CRITERION_TOLERANCE, # noqa: E501 - convergence_scaled_criterion_tolerance=0.0, + convergence_noise_corrected_criterion_tolerance=CONVERGENCE_NOISE_CORRECTED_FTOL, # noqa: E501 + convergence_ftol_scaled=0.0, convergence_slow_progress=None, initial_directions=INITIAL_DIRECTIONS, interpolation_rounding_error=INTERPOLATION_ROUNDING_ERROR, @@ -68,7 +68,7 @@ def nag_dfols( noise_multiplicative_level=None, noise_n_evals_per_point=None, random_directions_orthogonal=RANDOM_DIRECTIONS_ORTHOGONAL, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + stopping_maxfun=STOPPING_MAXFUN, threshold_for_safety_step=THRESHOLD_FOR_SAFETY_STEP, trustregion_expansion_factor_successful=TRUSTREGION_EXPANSION_FACTOR_SUCCESSFUL, trustregion_expansion_factor_very_successful=TRUSTREGION_EXPANSION_FACTOR_VERY_SUCCESSFUL, # noqa: E501 @@ -186,7 +186,7 @@ def nag_dfols( "n_extra_interpolation_points_per_hard_reset" ] - trustregion_reset_options["n_extra_interpolation_points_per_soft_reset"], - "model.rel_tol": convergence_scaled_criterion_tolerance, + "model.rel_tol": convergence_ftol_scaled, "regression.num_extra_steps": trustregion_n_extra_points_to_replace_successful, "regression.momentum_extra_steps": trustregion_use_momentum, "regression.increase_num_extra_steps_with_restart": trustregion_reset_options[ @@ -226,7 +226,7 @@ def nag_dfols( criterion, x0=x, bounds=(lower_bounds, upper_bounds), - 
maxfun=stopping_max_criterion_evaluations, + maxfun=stopping_maxfun, rhobeg=trustregion_initial_radius, npt=trustregion_n_interpolation_points, rhoend=convergence_minimal_trustregion_radius_tolerance, @@ -255,7 +255,7 @@ def nag_pybobyqa( clip_criterion_if_overflowing=CLIP_CRITERION_IF_OVERFLOWING, convergence_criterion_value=None, convergence_minimal_trustregion_radius_tolerance=CONVERGENCE_MINIMAL_TRUSTREGION_RADIUS_TOLERANCE, # noqa: E501 - convergence_noise_corrected_criterion_tolerance=CONVERGENCE_NOISE_CORRECTED_CRITERION_TOLERANCE, # noqa: E501 + convergence_noise_corrected_criterion_tolerance=CONVERGENCE_NOISE_CORRECTED_FTOL, # noqa: E501 convergence_slow_progress=None, initial_directions=INITIAL_DIRECTIONS, interpolation_rounding_error=INTERPOLATION_ROUNDING_ERROR, @@ -264,7 +264,7 @@ def nag_pybobyqa( noise_n_evals_per_point=None, random_directions_orthogonal=RANDOM_DIRECTIONS_ORTHOGONAL, seek_global_optimum=False, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + stopping_max_criterion_evaluations=STOPPING_MAXFUN, threshold_for_safety_step=THRESHOLD_FOR_SAFETY_STEP, trustregion_expansion_factor_successful=TRUSTREGION_EXPANSION_FACTOR_SUCCESSFUL, trustregion_expansion_factor_very_successful=TRUSTREGION_EXPANSION_FACTOR_VERY_SUCCESSFUL, # noqa: E501 diff --git a/src/optimagic/optimizers/neldermead.py b/src/optimagic/optimizers/neldermead.py index 7bb2f6e97..446a74663 100644 --- a/src/optimagic/optimizers/neldermead.py +++ b/src/optimagic/optimizers/neldermead.py @@ -5,9 +5,9 @@ from optimagic.batch_evaluators import process_batch_evaluator from optimagic.decorators import mark_minimizer from optimagic.optimization.algo_options import ( - CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE, - CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE, - STOPPING_MAX_ITERATIONS, + CONVERGENCE_SECOND_BEST_FTOL_ABS, + CONVERGENCE_SECOND_BEST_XTOL_ABS, + STOPPING_MAXITER, ) @@ -25,9 +25,9 @@ def neldermead_parallel( 
init_simplex_method="gao_han", n_cores=1, adaptive=True, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, - convergence_absolute_criterion_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE, # noqa: E501 - convergence_absolute_params_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE, # noqa: E501 + stopping_maxiter=STOPPING_MAXITER, + convergence_ftol_abs=CONVERGENCE_SECOND_BEST_FTOL_ABS, # noqa: E501 + convergence_xtol_abs=CONVERGENCE_SECOND_BEST_XTOL_ABS, # noqa: E501 batch_evaluator="joblib", ): """Parallel Nelder-Mead algorithm following Lee D., Wiswall M., A parallel @@ -52,15 +52,14 @@ def neldermead_parallel( for simplex size. The default is True. - stopping_max_iterations (int): Maximum number of algorithm iterations. + stopping_maxiter (int): Maximum number of algorithm iterations. The default is STOPPING_MAX_ITERATIONS. - convergence_absolute_criterion_tolerance (float): maximal difference between + convergence_ftol_abs (float): maximal difference between function value evaluated on simplex points. - The default is CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE. - convergence_absolute_params_tolerance (float): maximal distance between points in - the simplex. The default is CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE. + convergence_xtol_abs (float): maximal distance between points in + the simplex. batch_evaluator (string or callable): See :ref:`batch_evaluators` for details. Default "joblib". 
@@ -232,16 +231,14 @@ def func_parallel(args): # termination criteria if ( - np.max(np.abs(f_s[0, :] - f_s[1:, :])) - <= convergence_absolute_criterion_tolerance - and np.max(np.abs(s[0, :] - s[1:,])) - <= convergence_absolute_params_tolerance + np.max(np.abs(f_s[0, :] - f_s[1:, :])) <= convergence_ftol_abs + and np.max(np.abs(s[0, :] - s[1:,])) <= convergence_xtol_abs ): optimal = True converge = True reason_to_stop = "Termination codition satisfied" elif ( - iterations >= stopping_max_iterations + iterations >= stopping_maxiter ): # if maximum amount of iteration is exceeded optimal = True converge = False diff --git a/src/optimagic/optimizers/nlopt_optimizers.py b/src/optimagic/optimizers/nlopt_optimizers.py index 46001dd66..55056bec9 100644 --- a/src/optimagic/optimizers/nlopt_optimizers.py +++ b/src/optimagic/optimizers/nlopt_optimizers.py @@ -9,12 +9,12 @@ from optimagic.config import IS_NLOPT_INSTALLED from optimagic.decorators import mark_minimizer from optimagic.optimization.algo_options import ( - CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - STOPPING_MAX_CRITERION_EVALUATIONS, - STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + CONVERGENCE_FTOL_ABS, + CONVERGENCE_XTOL_ABS, + CONVERGENCE_FTOL_REL, + CONVERGENCE_XTOL_REL, + STOPPING_MAXFUN, + STOPPING_MAXFUN_GLOBAL, ) from optimagic.parameters.nonlinear_constraints import ( equality_as_inequality_constraints, @@ -36,11 +36,11 @@ def nlopt_bobyqa( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + 
convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the BOBYQA algorithm. @@ -55,11 +55,11 @@ def nlopt_bobyqa( upper_bounds, derivative=None, algorithm=nlopt.LN_BOBYQA, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -77,11 +77,11 @@ def nlopt_neldermead( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=0, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=0, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the Nelder-Mead simplex algorithm. 
@@ -97,11 +97,11 @@ def nlopt_neldermead( upper_bounds, algorithm=nlopt.LN_NELDERMEAD, derivative=None, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -117,11 +117,11 @@ def nlopt_praxis( criterion, x, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using principal-axis method. 
@@ -136,11 +136,11 @@ def nlopt_praxis( upper_bounds=None, algorithm=nlopt.LN_PRAXIS, derivative=None, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -159,11 +159,11 @@ def nlopt_cobyla( upper_bounds, *, nonlinear_constraints=(), - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the cobyla method. 
@@ -180,11 +180,11 @@ def nlopt_cobyla( algorithm=nlopt.LN_COBYLA, derivative=None, nonlinear_constraints=nonlinear_constraints, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -202,11 +202,11 @@ def nlopt_sbplx( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the "Subplex" algorithm. 
@@ -221,11 +221,11 @@ def nlopt_sbplx( lower_bounds, upper_bounds, algorithm=nlopt.LN_SBPLX, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -243,11 +243,11 @@ def nlopt_newuoa( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the NEWUOA algorithm. 
@@ -266,11 +266,11 @@ def nlopt_newuoa( lower_bounds, upper_bounds, algorithm=algo, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -289,11 +289,11 @@ def nlopt_tnewton( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the "TNEWTON" algorithm. 
@@ -309,11 +309,11 @@ def nlopt_tnewton( upper_bounds, algorithm=nlopt.LD_TNEWTON, derivative=derivative, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -332,11 +332,11 @@ def nlopt_lbfgs( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the "LBFGS" algorithm. 
@@ -352,11 +352,11 @@ def nlopt_lbfgs( upper_bounds, algorithm=nlopt.LD_TNEWTON, derivative=derivative, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -375,11 +375,11 @@ def nlopt_ccsaq( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using CCSAQ algorithm. 
@@ -394,11 +394,11 @@ def nlopt_ccsaq( upper_bounds, algorithm=nlopt.LD_CCSAQ, derivative=derivative, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -418,11 +418,11 @@ def nlopt_mma( upper_bounds, *, nonlinear_constraints=(), - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Minimize a scalar function using the method of moving asymptotes (MMA). 
@@ -441,11 +441,11 @@ def nlopt_mma( algorithm=nlopt.LD_MMA, derivative=derivative, nonlinear_constraints=nonlinear_constraints, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -464,11 +464,11 @@ def nlopt_var( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, rank_1_update=True, ): """Minimize a scalar function limited memory switching variable-metric method. 
@@ -488,11 +488,11 @@ def nlopt_var( upper_bounds, algorithm=algo, derivative=derivative, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -512,11 +512,11 @@ def nlopt_slsqp( upper_bounds, *, nonlinear_constraints=(), - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, ): """Optimize a scalar function based on SLSQP method. 
@@ -532,11 +532,11 @@ def nlopt_slsqp( algorithm=nlopt.LD_SLSQP, derivative=derivative, nonlinear_constraints=nonlinear_constraints, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) return out @@ -554,11 +554,11 @@ def nlopt_direct( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN_GLOBAL, locally_biased=False, random_search=False, unscaled_bounds=False, @@ -587,11 +587,11 @@ def nlopt_direct( lower_bounds, upper_bounds, algorithm=algo, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + 
convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) # this is a global optimizer @@ -612,11 +612,11 @@ def nlopt_esch( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN_GLOBAL, ): """Optimize a scalar function using the ESCH algorithm. @@ -630,11 +630,11 @@ def nlopt_esch( lower_bounds, upper_bounds, algorithm=nlopt.GN_ESCH, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) # this is a global optimizer @@ -656,11 +656,11 @@ def nlopt_isres( upper_bounds, *, nonlinear_constraints=(), - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - 
stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN_GLOBAL, ): """Optimize a scalar function using the ISRES algorithm. @@ -675,11 +675,11 @@ def nlopt_isres( upper_bounds, algorithm=nlopt.GN_ISRES, nonlinear_constraints=nonlinear_constraints, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, ) # this is a global optimizer @@ -700,11 +700,11 @@ def nlopt_crs2_lm( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN_GLOBAL, population_size=None, ): """Optimize a scalar function using the CRS2_LM algorithm. 
@@ -721,11 +721,11 @@ def nlopt_crs2_lm( lower_bounds, upper_bounds, algorithm=nlopt.GN_CRS2_LM, - convergence_xtol_rel=convergence_relative_params_tolerance, - convergence_xtol_abs=convergence_absolute_params_tolerance, - convergence_ftol_rel=convergence_relative_criterion_tolerance, - convergence_ftol_abs=convergence_absolute_criterion_tolerance, - stopping_max_eval=stopping_max_criterion_evaluations, + convergence_xtol_rel=convergence_xtol_rel, + convergence_xtol_abs=convergence_xtol_abs, + convergence_ftol_rel=convergence_ftol_rel, + convergence_ftol_abs=convergence_ftol_abs, + stopping_max_eval=stopping_maxfun, population_size=population_size, ) @@ -823,12 +823,12 @@ def _process_nlopt_results(nlopt_obj, solution_x): "Optimizer stopped because maximum value of criterion function was reached" ), 3: ( - "Optimizer stopped because convergence_relative_criterion_tolerance or " - "convergence_absolute_criterion_tolerance was reached" + "Optimizer stopped because convergence_ftol_rel or " + "convergence_ftol_abs was reached" ), 4: ( - "Optimizer stopped because convergence_relative_params_tolerance or " - "convergence_absolute_params_tolerance was reached" + "Optimizer stopped because convergence_xtol_rel or " + "convergence_xtol_abs was reached" ), 5: "Optimizer stopped because max_criterion_evaluations was reached", 6: "Optimizer stopped because max running time was reached", diff --git a/src/optimagic/optimizers/pounders.py b/src/optimagic/optimizers/pounders.py index 18f8ed8f4..37a767400 100644 --- a/src/optimagic/optimizers/pounders.py +++ b/src/optimagic/optimizers/pounders.py @@ -37,11 +37,11 @@ def pounders( x, lower_bounds, upper_bounds, - convergence_absolute_gradient_tolerance=1e-8, - convergence_relative_gradient_tolerance=1e-8, - convergence_scaled_gradient_tolerance=False, + convergence_gtol_abs=1e-8, + convergence_gtol_rel=1e-8, + convergence_gtol_scaled=False, max_interpolation_points=None, - stopping_max_iterations=2_000, + stopping_maxiter=2_000, 
trustregion_initial_radius=0.1, trustregion_minimal_radius=1e-6, trustregion_maximal_radius=1e6, @@ -97,11 +97,11 @@ def pounders( x0=x, lower_bounds=lower_bounds, upper_bounds=upper_bounds, - gtol_abs=convergence_absolute_gradient_tolerance, - gtol_rel=convergence_relative_gradient_tolerance, - gtol_scaled=convergence_scaled_gradient_tolerance, + gtol_abs=convergence_gtol_abs, + gtol_rel=convergence_gtol_rel, + gtol_scaled=convergence_gtol_scaled, maxinterp=max_interpolation_points, - maxiter=stopping_max_iterations, + maxiter=stopping_maxiter, delta=trustregion_initial_radius, delta_min=trustregion_minimal_radius, delta_max=trustregion_maximal_radius, diff --git a/src/optimagic/optimizers/pygmo_optimizers.py b/src/optimagic/optimizers/pygmo_optimizers.py index 754a8559f..7a907d327 100644 --- a/src/optimagic/optimizers/pygmo_optimizers.py +++ b/src/optimagic/optimizers/pygmo_optimizers.py @@ -10,8 +10,8 @@ from optimagic.decorators import mark_minimizer from optimagic.exceptions import NotInstalledError from optimagic.optimization.algo_options import ( - CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + CONVERGENCE_XTOL_REL, + STOPPING_MAXFUN_GLOBAL, get_population_size, ) @@ -39,7 +39,7 @@ def pygmo_gaco( n_cores=1, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, kernel_size=63, speed_parameter_q=1.0, oracle=0.0, @@ -47,7 +47,7 @@ def pygmo_gaco( threshold=1, speed_of_std_values_convergence=7, stopping_max_n_without_improvements=100000, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + stopping_maxfun=STOPPING_MAXFUN_GLOBAL, focus=0.0, cache=False, ): @@ -71,7 +71,7 @@ def pygmo_gaco( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "ker": kernel_size, "q": speed_parameter_q, "oracle": oracle, @@ -79,7 +79,7 @@ def pygmo_gaco( "threshold": 
threshold, "n_gen_mark": int(speed_of_std_values_convergence), "impstop": stopping_max_n_without_improvements, - "evalstop": stopping_max_criterion_evaluations, + "evalstop": stopping_maxfun, "focus": focus, "memory": cache, } @@ -116,7 +116,7 @@ def pygmo_bee_colony( lower_bounds, upper_bounds, *, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, seed=None, discard_start_params=False, max_n_trials=1, @@ -137,7 +137,7 @@ def pygmo_bee_colony( discard_start_params=discard_start_params, algo_specific_options={ "limit": max_n_trials, - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), }, ) @@ -168,12 +168,12 @@ def pygmo_de( population_size=None, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, weight_coefficient=0.8, crossover_probability=0.9, mutation_variant="rand/1/exp", convergence_criterion_tolerance=1e-6, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, + convergence_relative_params_tolerance=CONVERGENCE_XTOL_REL, ): """Minimize a scalar function using the differential evolution algorithm. @@ -203,7 +203,7 @@ def pygmo_de( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "F": weight_coefficient, "CR": crossover_probability, "variant": mutation_variant, @@ -244,7 +244,7 @@ def pygmo_sea( population_size=None, seed=None, discard_start_params=False, - stopping_max_iterations=10_000, # Each generation will compute the objective once + stopping_maxiter=10_000, # Each generation will compute the objective once ): r"""Minimize a scalar function using the (N+1)-ES simple evolutionary algorithm. 
@@ -261,7 +261,7 @@ def pygmo_sea( population_size=population_size, seed=seed, discard_start_params=discard_start_params, - algo_specific_options={"gen": int(stopping_max_iterations)}, + algo_specific_options={"gen": int(stopping_maxiter)}, ) res = _minimize_pygmo( @@ -291,7 +291,7 @@ def pygmo_sga( population_size=None, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, crossover_probability=0.9, crossover_strategy="exponential", eta_c=None, @@ -364,7 +364,7 @@ def pygmo_sga( param_s = 2 algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "cr": crossover_probability, "eta_c": eta_c, "m": mutation_probability, @@ -409,7 +409,7 @@ def pygmo_sade( seed=None, discard_start_params=False, jde=True, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, mutation_variant="rand/1/exp", keep_adapted_params=False, ftol=1e-6, @@ -451,7 +451,7 @@ def pygmo_sade( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "variant": mutation_variant, "variant_adptv": 1 if jde else 2, "ftol": ftol, @@ -492,7 +492,7 @@ def pygmo_cmaes( population_size=None, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, backward_horizon=None, variance_loss_compensation=None, learning_rate_rank_one_update=None, @@ -515,7 +515,7 @@ def pygmo_cmaes( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "cc": _replace_none(var=backward_horizon, none_value=-1.0), "cs": _replace_none(var=variance_loss_compensation, none_value=-1.0), "c1": _replace_none(var=learning_rate_rank_one_update, none_value=-1.0), @@ -621,7 +621,7 @@ def pygmo_pso( population_size=None, seed=None, discard_start_params=False, - 
stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, omega=0.7298, force_of_previous_best=2.05, force_of_best_in_neighborhood=2.05, @@ -667,7 +667,7 @@ def pygmo_pso( } algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "omega": omega, "eta1": force_of_previous_best, "eta2": force_of_best_in_neighborhood, @@ -715,7 +715,7 @@ def pygmo_pso_gen( n_cores=1, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, omega=0.7298, force_of_previous_best=2.05, force_of_best_in_neighborhood=2.05, @@ -762,7 +762,7 @@ def pygmo_pso_gen( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "omega": omega, "eta1": force_of_previous_best, "eta2": force_of_best_in_neighborhood, @@ -865,7 +865,7 @@ def pygmo_xnes( population_size=None, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, learning_rate_mean_update=1.0, learning_rate_step_size_update=None, learning_rate_cov_matrix_update=None, @@ -887,7 +887,7 @@ def pygmo_xnes( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "eta_mu": _replace_none(learning_rate_mean_update, -1), "eta_sigma": _replace_none(learning_rate_step_size_update, -1), "eta_b": _replace_none(learning_rate_cov_matrix_update, -1), @@ -931,7 +931,7 @@ def pygmo_gwo( population_size=None, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, ): """Minimize a scalar function using the Grey Wolf Optimizer. 
@@ -948,7 +948,7 @@ def pygmo_gwo( population_size=population_size, seed=seed, discard_start_params=discard_start_params, - algo_specific_options={"gen": int(stopping_max_iterations)}, + algo_specific_options={"gen": int(stopping_maxiter)}, ) res = _minimize_pygmo( @@ -978,7 +978,7 @@ def pygmo_compass_search( population_size=None, seed=None, discard_start_params=False, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + stopping_maxfun=STOPPING_MAXFUN_GLOBAL, start_range=0.1, stop_range=0.01, reduction_coeff=0.5, @@ -1000,7 +1000,7 @@ def pygmo_compass_search( population_size = 100 algo_specific_options = { - "max_fevals": stopping_max_criterion_evaluations, + "max_fevals": stopping_maxfun, "start_range": start_range, "stop_range": stop_range, "reduction_coeff": reduction_coeff, @@ -1039,7 +1039,7 @@ def pygmo_ihs( population_size=None, seed=None, discard_start_params=False, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, choose_from_memory_probability=0.85, min_pitch_adjustment_rate=0.35, max_pitch_adjustment_rate=0.99, @@ -1062,7 +1062,7 @@ def pygmo_ihs( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "phmcr": choose_from_memory_probability, "ppar_min": min_pitch_adjustment_rate, "ppar_max": max_pitch_adjustment_rate, @@ -1104,7 +1104,7 @@ def pygmo_de1220( seed=None, discard_start_params=False, jde=True, - stopping_max_iterations=STOPPING_MAX_ITERATIONS_GENETIC, + stopping_maxiter=STOPPING_MAX_ITERATIONS_GENETIC, allowed_variants=None, keep_adapted_params=False, ftol=1e-6, @@ -1151,7 +1151,7 @@ def pygmo_de1220( ) algo_specific_options = { - "gen": int(stopping_max_iterations), + "gen": int(stopping_maxiter), "variant_adptv": 1 if jde else 2, "ftol": ftol, "xtol": xtol, diff --git a/src/optimagic/optimizers/scipy_optimizers.py b/src/optimagic/optimizers/scipy_optimizers.py index 608e04146..602367188 100644 --- 
a/src/optimagic/optimizers/scipy_optimizers.py +++ b/src/optimagic/optimizers/scipy_optimizers.py @@ -42,19 +42,19 @@ from optimagic.batch_evaluators import process_batch_evaluator from optimagic.decorators import mark_minimizer from optimagic.optimization.algo_options import ( - CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE, - CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE, - CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE, + CONVERGENCE_FTOL_ABS, + CONVERGENCE_GTOL_ABS, + CONVERGENCE_XTOL_ABS, + CONVERGENCE_FTOL_REL, + CONVERGENCE_GTOL_REL, + CONVERGENCE_XTOL_REL, + CONVERGENCE_SECOND_BEST_FTOL_ABS, + CONVERGENCE_SECOND_BEST_XTOL_ABS, LIMITED_MEMORY_STORAGE_LENGTH, MAX_LINE_SEARCH_STEPS, - STOPPING_MAX_CRITERION_EVALUATIONS, - STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, - STOPPING_MAX_ITERATIONS, + STOPPING_MAXFUN, + STOPPING_MAXFUN_GLOBAL, + STOPPING_MAXITER, ) from optimagic.parameters.nonlinear_constraints import ( equality_as_inequality_constraints, @@ -70,10 +70,10 @@ def scipy_lbfgsb( lower_bounds, upper_bounds, *, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_absolute_gradient_tolerance=CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_gtol_abs=CONVERGENCE_GTOL_ABS, + stopping_maxfun=STOPPING_MAXFUN, + stopping_maxiter=STOPPING_MAXITER, limited_memory_storage_length=LIMITED_MEMORY_STORAGE_LENGTH, max_line_search_steps=MAX_LINE_SEARCH_STEPS, ): @@ -85,10 +85,10 @@ def scipy_lbfgsb( """ options = { "maxcor": limited_memory_storage_length, - "ftol": convergence_relative_criterion_tolerance, - "gtol": 
convergence_absolute_gradient_tolerance, - "maxfun": stopping_max_criterion_evaluations, - "maxiter": stopping_max_iterations, + "ftol": convergence_ftol_rel, + "gtol": convergence_gtol_abs, + "maxfun": stopping_maxfun, + "maxiter": stopping_maxiter, "maxls": max_line_search_steps, } res = scipy.optimize.minimize( @@ -112,8 +112,8 @@ def scipy_slsqp( upper_bounds, *, nonlinear_constraints=(), - convergence_absolute_criterion_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE, # noqa: E501 - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_ftol_abs=CONVERGENCE_SECOND_BEST_FTOL_ABS, # noqa: E501 + stopping_maxiter=STOPPING_MAXITER, ): """Minimize a scalar function of one or more variables using the SLSQP algorithm. @@ -122,8 +122,8 @@ def scipy_slsqp( """ options = { - "maxiter": stopping_max_iterations, - "ftol": convergence_absolute_criterion_tolerance, + "maxiter": stopping_maxiter, + "ftol": convergence_ftol_abs, } res = scipy.optimize.minimize( @@ -146,10 +146,10 @@ def scipy_neldermead( lower_bounds, upper_bounds, *, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, - convergence_absolute_criterion_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE, # noqa: E501 - convergence_absolute_params_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE, # noqa: E501 + stopping_maxiter=STOPPING_MAXITER, + stopping_maxfun=STOPPING_MAXFUN, + convergence_ftol_abs=CONVERGENCE_SECOND_BEST_FTOL_ABS, # noqa: E501 + convergence_xtol_abs=CONVERGENCE_SECOND_BEST_XTOL_ABS, # noqa: E501 adaptive=False, ): """Minimize a scalar function using the Nelder-Mead algorithm. @@ -159,12 +159,12 @@ def scipy_neldermead( """ options = { - "maxiter": stopping_max_iterations, - "maxfev": stopping_max_criterion_evaluations, + "maxiter": stopping_maxiter, + "maxfev": stopping_maxfun, # both tolerances seem to have to be fulfilled for Nelder-Mead to converge. 
# if not both are specified it does not converge in our tests. - "xatol": convergence_absolute_params_tolerance, - "fatol": convergence_absolute_criterion_tolerance, + "xatol": convergence_xtol_abs, + "fatol": convergence_ftol_abs, "adaptive": adaptive, } @@ -186,10 +186,10 @@ def scipy_powell( lower_bounds, upper_bounds, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + stopping_maxfun=STOPPING_MAXFUN, + stopping_maxiter=STOPPING_MAXITER, ): """Minimize a scalar function using the modified Powell method. @@ -198,10 +198,10 @@ def scipy_powell( """ options = { - "xtol": convergence_relative_params_tolerance, - "ftol": convergence_relative_criterion_tolerance, - "maxfev": stopping_max_criterion_evaluations, - "maxiter": stopping_max_iterations, + "xtol": convergence_xtol_rel, + "ftol": convergence_ftol_rel, + "maxfev": stopping_maxfun, + "maxiter": stopping_maxiter, } res = scipy.optimize.minimize( @@ -220,8 +220,8 @@ def scipy_bfgs( criterion_and_derivative, x, *, - convergence_absolute_gradient_tolerance=CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_gtol_abs=CONVERGENCE_GTOL_ABS, + stopping_maxiter=STOPPING_MAXITER, norm=np.inf, ): """Minimize a scalar function of one or more variables using the BFGS algorithm. 
@@ -231,8 +231,8 @@ def scipy_bfgs( """ options = { - "gtol": convergence_absolute_gradient_tolerance, - "maxiter": stopping_max_iterations, + "gtol": convergence_gtol_abs, + "maxiter": stopping_maxiter, "norm": norm, } @@ -252,8 +252,8 @@ def scipy_conjugate_gradient( criterion_and_derivative, x, *, - convergence_absolute_gradient_tolerance=CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_gtol_abs=CONVERGENCE_GTOL_ABS, + stopping_maxiter=STOPPING_MAXITER, norm=np.inf, ): """Minimize a function using a nonlinear conjugate gradient algorithm. @@ -263,8 +263,8 @@ def scipy_conjugate_gradient( """ options = { - "gtol": convergence_absolute_gradient_tolerance, - "maxiter": stopping_max_iterations, + "gtol": convergence_gtol_abs, + "maxiter": stopping_maxiter, "norm": norm, } @@ -284,8 +284,8 @@ def scipy_newton_cg( criterion_and_derivative, x, *, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + stopping_maxiter=STOPPING_MAXITER, ): """Minimize a scalar function using Newton's conjugate gradient algorithm. @@ -294,8 +294,8 @@ def scipy_newton_cg( """ options = { - "xtol": convergence_relative_params_tolerance, - "maxiter": stopping_max_iterations, + "xtol": convergence_xtol_rel, + "maxiter": stopping_maxiter, } res = scipy.optimize.minimize( @@ -315,8 +315,8 @@ def scipy_cobyla( x, *, nonlinear_constraints=(), - stopping_max_iterations=STOPPING_MAX_ITERATIONS, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, + stopping_maxiter=STOPPING_MAXITER, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, trustregion_initial_radius=None, ): """Minimize a scalar function of one or more variables using the COBYLA algorithm. 
@@ -328,7 +328,7 @@ def scipy_cobyla( if trustregion_initial_radius is None: trustregion_initial_radius = calculate_trustregion_initial_radius(x) - options = {"maxiter": stopping_max_iterations, "rhobeg": trustregion_initial_radius} + options = {"maxiter": stopping_maxiter, "rhobeg": trustregion_initial_radius} # cannot handle equality constraints nonlinear_constraints = equality_as_inequality_constraints(nonlinear_constraints) @@ -339,7 +339,7 @@ def scipy_cobyla( method="COBYLA", constraints=nonlinear_constraints, options=options, - tol=convergence_relative_params_tolerance, + tol=convergence_xtol_rel, ) return process_scipy_result(res) @@ -352,10 +352,10 @@ def scipy_truncated_newton( lower_bounds, upper_bounds, *, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, - convergence_absolute_criterion_tolerance=CONVERGENCE_ABSOLUTE_CRITERION_TOLERANCE, - convergence_absolute_params_tolerance=CONVERGENCE_ABSOLUTE_PARAMS_TOLERANCE, - convergence_absolute_gradient_tolerance=CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, + stopping_maxfun=STOPPING_MAXFUN, + convergence_ftol_abs=CONVERGENCE_FTOL_ABS, + convergence_xtol_abs=CONVERGENCE_XTOL_ABS, + convergence_gtol_abs=CONVERGENCE_GTOL_ABS, func_min_estimate=0, max_hess_evaluations_per_iteration=-1, max_step_for_line_search=0, @@ -372,12 +372,12 @@ def scipy_truncated_newton( options = { # scipy/optimize/tnc/tnc.c::809 and 844 show that ftol is the # absolute criterion tolerance - "ftol": convergence_absolute_criterion_tolerance, + "ftol": convergence_ftol_abs, # scipy/optimize/tnc/tnc.c::856 show sthat xtol is the absolute parameter # tolerance - "xtol": convergence_absolute_params_tolerance, - "gtol": convergence_absolute_gradient_tolerance, - "maxfun": stopping_max_criterion_evaluations, + "xtol": convergence_xtol_abs, + "gtol": convergence_gtol_abs, + "maxfun": stopping_maxfun, "maxCGit": max_hess_evaluations_per_iteration, "stepmx": max_step_for_line_search, "minfev": func_min_estimate, @@ -406,9 
+406,9 @@ def scipy_trust_constr( upper_bounds, *, nonlinear_constraints=(), - convergence_absolute_gradient_tolerance=1e-08, - convergence_relative_params_tolerance=CONVERGENCE_RELATIVE_PARAMS_TOLERANCE, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + convergence_gtol_abs=1e-08, + convergence_xtol_rel=CONVERGENCE_XTOL_REL, + stopping_maxiter=STOPPING_MAXITER, trustregion_initial_radius=None, ): """Minimize a scalar function of one or more variables subject to constraints. @@ -421,9 +421,9 @@ def scipy_trust_constr( trustregion_initial_radius = calculate_trustregion_initial_radius(x) options = { - "gtol": convergence_absolute_gradient_tolerance, - "maxiter": stopping_max_iterations, - "xtol": convergence_relative_params_tolerance, + "gtol": convergence_gtol_abs, + "maxiter": stopping_maxiter, + "xtol": convergence_xtol_rel, "initial_tr_radius": trustregion_initial_radius, } @@ -492,9 +492,9 @@ def _scipy_least_squares( lower_bounds, upper_bounds, *, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_relative_gradient_tolerance=CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_gtol_rel=CONVERGENCE_GTOL_REL, + stopping_maxfun=STOPPING_MAXFUN, relative_step_size_diff_approx=None, tr_solver=None, tr_solver_options=None, @@ -516,9 +516,9 @@ def _scipy_least_squares( jac=derivative, # Don't use get_scipy_bounds, b.c. 
least_squares uses np.inf bounds=(lower_bounds, upper_bounds), - max_nfev=stopping_max_criterion_evaluations, - ftol=convergence_relative_criterion_tolerance, - gtol=convergence_relative_gradient_tolerance, + max_nfev=stopping_maxfun, + ftol=convergence_ftol_rel, + gtol=convergence_gtol_rel, method=method, diff_step=relative_step_size_diff_approx, tr_solver=tr_solver, @@ -547,9 +547,9 @@ def scipy_ls_lm( derivative, x, *, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - convergence_relative_gradient_tolerance=CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + convergence_gtol_rel=CONVERGENCE_GTOL_REL, + stopping_maxfun=STOPPING_MAXFUN, relative_step_size_diff_approx=None, tr_solver=None, tr_solver_options=None, @@ -563,9 +563,9 @@ def scipy_ls_lm( fun=criterion, x0=x, jac=derivative, - max_nfev=stopping_max_criterion_evaluations, - ftol=convergence_relative_criterion_tolerance, - gtol=convergence_relative_gradient_tolerance, + max_nfev=stopping_maxfun, + ftol=convergence_ftol_rel, + gtol=convergence_gtol_rel, method="lm", diff_step=relative_step_size_diff_approx, tr_solver=tr_solver, @@ -689,15 +689,15 @@ def scipy_differential_evolution( nonlinear_constraints, *, strategy="best1bin", - stopping_max_iterations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + stopping_maxiter=STOPPING_MAXFUN_GLOBAL, population_size_multiplier=15, - convergence_relative_criterion_tolerance=0.01, + convergence_ftol_rel=0.01, mutation_constant=(0.5, 1), recombination_constant=0.7, seed=None, polish=True, sampling_method="latinhypercube", - convergence_absolute_criterion_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE, # noqa: E501 + convergence_ftol_abs=CONVERGENCE_SECOND_BEST_FTOL_ABS, # noqa: E501 n_cores=1, batch_evaluator="joblib", ): @@ -712,15 +712,15 @@ def scipy_differential_evolution( func=criterion, 
bounds=_get_scipy_bounds(lower_bounds, upper_bounds), strategy=strategy, - maxiter=stopping_max_iterations, + maxiter=stopping_maxiter, popsize=population_size_multiplier, - tol=convergence_relative_criterion_tolerance, + tol=convergence_ftol_rel, mutation=mutation_constant, recombination=recombination_constant, seed=seed, polish=polish, init=sampling_method, - atol=convergence_absolute_criterion_tolerance, + atol=convergence_ftol_abs, updating="deferred", workers=workers, constraints=_get_scipy_constraints(nonlinear_constraints), @@ -746,8 +746,8 @@ def scipy_shgo( max_sampling_evaluations=None, convergence_minimum_criterion_value=None, convergence_minimum_criterion_tolerance=1e-4, - stopping_max_iterations=None, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + stopping_maxiter=None, + stopping_maxfun=STOPPING_MAXFUN_GLOBAL, stopping_max_processing_time=None, minimum_homology_group_rank_differential=None, symmetry=False, @@ -783,8 +783,8 @@ def scipy_shgo( "maxfev": max_sampling_evaluations, "f_min": convergence_minimum_criterion_value, "f_tol": convergence_minimum_criterion_tolerance, - "maxiter": stopping_max_iterations, - "maxev": stopping_max_criterion_evaluations, + "maxiter": stopping_maxiter, + "maxev": stopping_maxfun, "maxtime": stopping_max_processing_time, "minhgrd": minimum_homology_group_rank_differential, "symmetry": symmetry, @@ -819,14 +819,14 @@ def scipy_dual_annealing( upper_bounds, x, *, - stopping_max_iterations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + stopping_maxiter=STOPPING_MAXFUN_GLOBAL, local_algorithm="L-BFGS-B", local_algo_options=None, initial_temperature=5230.0, restart_temperature_ratio=2e-05, visit=2.62, accept=-5.0, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, + stopping_maxfun=STOPPING_MAXFUN, seed=None, no_local_search=False, ): @@ -848,13 +848,13 @@ def scipy_dual_annealing( res = scipy.optimize.dual_annealing( func=criterion, 
bounds=_get_scipy_bounds(lower_bounds, upper_bounds), - maxiter=stopping_max_iterations, + maxiter=stopping_maxiter, minimizer_kwargs=minimizer_kwargs, initial_temp=initial_temperature, restart_temp_ratio=restart_temperature_ratio, visit=visit, accept=accept, - maxfun=stopping_max_criterion_evaluations, + maxfun=stopping_maxfun, seed=seed, no_local_search=no_local_search, x0=x, @@ -870,9 +870,9 @@ def scipy_direct( upper_bounds, x, # noqa: ARG001 *, - convergence_relative_criterion_tolerance=CONVERGENCE_RELATIVE_CRITERION_TOLERANCE, - stopping_max_criterion_evaluations=STOPPING_MAX_CRITERION_EVALUATIONS, - stopping_max_iterations=STOPPING_MAX_CRITERION_EVALUATIONS_GLOBAL, + convergence_ftol_rel=CONVERGENCE_FTOL_REL, + stopping_maxfun=STOPPING_MAXFUN, + stopping_maxiter=STOPPING_MAXFUN_GLOBAL, locally_biased=True, convergence_minimum_criterion_value=-np.inf, convergence_minimum_criterion_tolerance=1e-4, @@ -889,9 +889,9 @@ def scipy_direct( res = scipy.optimize.direct( func=criterion, bounds=_get_scipy_bounds(lower_bounds, upper_bounds), - eps=convergence_relative_criterion_tolerance, - maxfun=stopping_max_criterion_evaluations, - maxiter=stopping_max_iterations, + eps=convergence_ftol_rel, + maxfun=stopping_maxfun, + maxiter=stopping_maxiter, locally_biased=locally_biased, f_min=convergence_minimum_criterion_value, f_min_rtol=convergence_minimum_criterion_tolerance, diff --git a/src/optimagic/optimizers/tao_optimizers.py b/src/optimagic/optimizers/tao_optimizers.py index f7f5039b2..64c221e81 100644 --- a/src/optimagic/optimizers/tao_optimizers.py +++ b/src/optimagic/optimizers/tao_optimizers.py @@ -9,10 +9,10 @@ from optimagic.decorators import mark_minimizer from optimagic.exceptions import NotInstalledError from optimagic.optimization.algo_options import ( - CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE, - CONVERGENCE_SCALED_GRADIENT_TOLERANCE, - STOPPING_MAX_ITERATIONS, + CONVERGENCE_GTOL_ABS, + CONVERGENCE_GTOL_REL, + 
CONVERGENCE_GTOL_SCALED, + STOPPING_MAXITER, ) from optimagic.utilities import calculate_trustregion_initial_radius @@ -32,11 +32,11 @@ def tao_pounders( lower_bounds, upper_bounds, *, - convergence_absolute_gradient_tolerance=CONVERGENCE_ABSOLUTE_GRADIENT_TOLERANCE, - convergence_relative_gradient_tolerance=CONVERGENCE_RELATIVE_GRADIENT_TOLERANCE, - convergence_scaled_gradient_tolerance=CONVERGENCE_SCALED_GRADIENT_TOLERANCE, + convergence_gtol_abs=CONVERGENCE_GTOL_ABS, + convergence_gtol_rel=CONVERGENCE_GTOL_REL, + convergence_gtol_scaled=CONVERGENCE_GTOL_SCALED, trustregion_initial_radius=None, - stopping_max_iterations=STOPPING_MAX_ITERATIONS, + stopping_maxiter=STOPPING_MAXITER, ): r"""Minimize a function using the POUNDERs algorithm. @@ -102,21 +102,9 @@ def func_tao(tao, x, resid_out): # noqa: ARG001 # scaled_gradient_tolerance manually we manually set absolute_gradient_tolerance and # or relative_gradient_tolerance to zero once a subset of these two is turned off # and scaled_gradient_tolerance is still turned on. - default_gatol = ( - convergence_absolute_gradient_tolerance - if convergence_absolute_gradient_tolerance - else -1 - ) - default_gttol = ( - convergence_scaled_gradient_tolerance - if convergence_scaled_gradient_tolerance - else -1 - ) - default_grtol = ( - convergence_relative_gradient_tolerance - if convergence_relative_gradient_tolerance - else -1 - ) + default_gatol = convergence_gtol_abs if convergence_gtol_abs else -1 + default_gttol = convergence_gtol_scaled if convergence_gtol_scaled else -1 + default_grtol = convergence_gtol_rel if convergence_gtol_rel else -1 # Set tolerances for default convergence tests. tao.setTolerances( gatol=default_gatol, @@ -126,28 +114,18 @@ def func_tao(tao, x, resid_out): # noqa: ARG001 # Set user defined convergence tests. Beware that specifying multiple tests could # overwrite others or lead to unclear behavior. 
- if stopping_max_iterations is not None: - tao.setConvergenceTest(functools.partial(_max_iters, stopping_max_iterations)) - elif ( - convergence_scaled_gradient_tolerance is False - and convergence_absolute_gradient_tolerance is False - ): - tao.setConvergenceTest( - functools.partial(_grtol_conv, convergence_relative_gradient_tolerance) - ) - elif ( - convergence_relative_gradient_tolerance is False - and convergence_scaled_gradient_tolerance is False - ): - tao.setConvergenceTest( - functools.partial(_gatol_conv, convergence_absolute_gradient_tolerance) - ) - elif convergence_scaled_gradient_tolerance is False: + if stopping_maxiter is not None: + tao.setConvergenceTest(functools.partial(_max_iters, stopping_maxiter)) + elif convergence_gtol_scaled is False and convergence_gtol_abs is False: + tao.setConvergenceTest(functools.partial(_grtol_conv, convergence_gtol_rel)) + elif convergence_gtol_rel is False and convergence_gtol_scaled is False: + tao.setConvergenceTest(functools.partial(_gatol_conv, convergence_gtol_abs)) + elif convergence_gtol_scaled is False: tao.setConvergenceTest( functools.partial( _grtol_gatol_conv, - convergence_relative_gradient_tolerance, - convergence_absolute_gradient_tolerance, + convergence_gtol_rel, + convergence_gtol_abs, ) ) diff --git a/tests/estimagic/test_estimate_ml.py b/tests/estimagic/test_estimate_ml.py index 5df2002a2..2604b4de6 100644 --- a/tests/estimagic/test_estimate_ml.py +++ b/tests/estimagic/test_estimate_ml.py @@ -265,7 +265,7 @@ def test_estimate_ml_with_logit_constraints( optimize_options = { "algorithm": "scipy_lbfgsb", - "algo_options": {"convergence.relative_criterion_tolerance": 1e-12}, + "algo_options": {"convergence.ftol_rel": 1e-12}, } if "fun_and_jac" in optimize_options: diff --git a/tests/optimagic/optimization/test_multistart.py b/tests/optimagic/optimization/test_multistart.py index 75baac237..6806af2e5 100644 --- a/tests/optimagic/optimization/test_multistart.py +++ 
b/tests/optimagic/optimization/test_multistart.py @@ -226,7 +226,7 @@ def ackley(x): "params": np.full(dim, -10), "lower_bounds": np.full(dim, -32), "upper_bounds": np.full(dim, 32), - "algo_options": {"stopping.max_criterion_evaluations": 1000}, + "algo_options": {"stopping.maxfun": 1000}, } minimize( diff --git a/tests/optimagic/optimization/test_with_constraints.py b/tests/optimagic/optimization/test_with_constraints.py index 6110387b6..733b29d14 100644 --- a/tests/optimagic/optimization/test_with_constraints.py +++ b/tests/optimagic/optimization/test_with_constraints.py @@ -173,7 +173,7 @@ def test_constrained_minimization( algorithm=algorithm, jac=derivative, constraints=constraints, - algo_options={"convergence.relative_criterion_tolerance": 1e-12}, + algo_options={"convergence.ftol_rel": 1e-12}, ) if params_type == "pandas": @@ -213,7 +213,7 @@ def test_three_independent_constraints(): params=params, algorithm="scipy_lbfgsb", constraints=constraints, - algo_options={"convergence.relative_criterion_tolerance": 1e-12}, + algo_options={"convergence.ftol_rel": 1e-12}, ) expected = np.array([0] * 4 + [4, 5] + [0] + [7.5] * 2 + [0]) diff --git a/tests/optimagic/optimizers/test_bhhh.py b/tests/optimagic/optimizers/test_bhhh.py index 789a622b8..a5dbd1168 100644 --- a/tests/optimagic/optimizers/test_bhhh.py +++ b/tests/optimagic/optimizers/test_bhhh.py @@ -129,8 +129,8 @@ def test_maximum_likelihood(criterion_and_derivative, result_statsmodels, reques result_bhhh = bhhh_internal( criterion_and_derivative, x=x, - convergence_absolute_gradient_tolerance=1e-8, - stopping_max_iterations=200, + convergence_gtol_abs=1e-8, + stopping_maxiter=200, ) aaae(result_bhhh["solution_x"], result_expected.params, decimal=4) diff --git a/tests/optimagic/optimizers/test_fides_options.py b/tests/optimagic/optimizers/test_fides_options.py index 5a0c65ab2..389f83f77 100644 --- a/tests/optimagic/optimizers/test_fides_options.py +++ b/tests/optimagic/optimizers/test_fides_options.py @@ 
-22,11 +22,11 @@ {"hessian_update_strategy": "sr1"}, {"hessian_update_strategy": "DFP"}, {"hessian_update_strategy": "bb"}, - {"convergence_relative_criterion_tolerance": 1e-6}, - {"convergence_absolute_params_tolerance": 1e-6}, - {"convergence_absolute_gradient_tolerance": 1e-6}, - {"convergence_relative_gradient_tolerance": 1e-6}, - {"stopping_max_iterations": 100}, + {"convergence_ftol_rel": 1e-6}, + {"convergence_xtol_abs": 1e-6}, + {"convergence_gtol_abs": 1e-6}, + {"convergence_gtol_rel": 1e-6}, + {"stopping_maxiter": 100}, {"stopping_max_seconds": 200}, {"trustregion_initial_radius": 20, "trustregion_stepback_strategy": "truncate"}, {"trustregion_subspace_dimension": "full"}, @@ -81,7 +81,7 @@ def test_fides_stop_after_one_iteration(): x=np.array([1, -5, 3]), lower_bounds=np.array([-10, -10, -10]), upper_bounds=np.array([10, 10, 10]), - stopping_max_iterations=1, + stopping_maxiter=1, ) assert not res["success"] assert res["n_iterations"] == 1 diff --git a/tests/optimagic/optimizers/test_ipopt_options.py b/tests/optimagic/optimizers/test_ipopt_options.py index d50bab776..6f9aba809 100644 --- a/tests/optimagic/optimizers/test_ipopt_options.py +++ b/tests/optimagic/optimizers/test_ipopt_options.py @@ -8,8 +8,8 @@ test_cases = [ {}, - {"convergence_relative_criterion_tolerance": 1e-7}, - {"stopping_max_iterations": 1_100_000}, + {"convergence_ftol_rel": 1e-7}, + {"stopping_maxiter": 1_100_000}, {"mu_target": 1e-8}, {"s_max": 200}, {"stopping_max_wall_time_seconds": 200}, diff --git a/tests/optimagic/optimizers/test_neldermead.py b/tests/optimagic/optimizers/test_neldermead.py index d04727677..62ece7a81 100644 --- a/tests/optimagic/optimizers/test_neldermead.py +++ b/tests/optimagic/optimizers/test_neldermead.py @@ -128,7 +128,7 @@ def test_fides_stop_after_one_iteration(): res = neldermead_parallel( criterion=sphere, x=np.array([1, -5, 3]), - stopping_max_iterations=1, + stopping_maxiter=1, ) assert not res["success"] assert res["n_iterations"] == 1 From 
4eda2de3bec52e8907d359d4900e62361268aa00 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Thu, 18 Jul 2024 19:16:22 +0200 Subject: [PATCH 16/25] Move some default algo options to nag optimizers. --- .pre-commit-config.yaml | 2 - src/optimagic/optimization/algo_options.py | 330 --------------------- src/optimagic/optimizers/nag_optimizers.py | 327 ++++++++++++++++++-- 3 files changed, 306 insertions(+), 353 deletions(-) diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 43ba1e7cf..ab79e1952 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -50,8 +50,6 @@ repos: - id: trailing-whitespace exclude: docs/ - id: check-ast - - id: check-docstring-first - exclude: src/optimagic/optimization/algo_options.py - repo: https://github.com/adrienverge/yamllint.git rev: v1.35.1 hooks: diff --git a/src/optimagic/optimization/algo_options.py b/src/optimagic/optimization/algo_options.py index 5c854bc7e..425caebbb 100644 --- a/src/optimagic/optimization/algo_options.py +++ b/src/optimagic/optimization/algo_options.py @@ -1,18 +1,5 @@ import numpy as np -""" -The order is the following: - -1. Convergence and Stopping Criteria -2. Trust Region Parameters -3. Other Numerical Algorithm Group Tuning Parameters - -""" -""" -===================================================================================== -1. Stopping Criteria -===================================================================================== -""" CONVERGENCE_FTOL_REL = 2e-9 """float: Stop when the relative improvement between two iterations is below this. @@ -79,20 +66,6 @@ """ -CONVERGENCE_NOISE_CORRECTED_FTOL = 1.0 -"""float: Stop when the evaluations on the set of interpolation points all fall within - this factor of the noise level. The default is 1, i.e. when all evaluations are - within the noise level. If you want to not use this criterion but still flag your - criterion function as noisy, set this tolerance to 0.0. - - .. 
warning:: - Very small values, as in most other tolerances don't make sense here. - -""" - -CONVERGENCE_MINIMAL_TRUSTREGION_RADIUS_TOLERANCE = 1e-8 -"""float: Stop when the lower trust region radius falls below this value.""" - STOPPING_MAXFUN = 1_000_000 """int: @@ -136,36 +109,6 @@ """ -CONVERGENCE_SLOW_PROGRESS = { - "threshold_to_characterize_as_slow": 1e-8, - "max_insufficient_improvements": None, - "comparison_period": 5, -} -"""dict: Specification of when to terminate or reset the optimization because of only - slow improvements. This is similar to an absolute criterion tolerance only that - instead of a single improvement the average over several iterations must be small. - - Possible entries are: - threshold_to_characterize_as_slow (float): Threshold whether an improvement - is insufficient. Note: the improvement is divided by the - ``comparison_period``. - So this is the required average improvement per iteration over the - comparison period. - max_insufficient_improvements (int): Number of consecutive - insufficient improvements before termination (or reset). Default is - ``20 * len(x)``. - comparison_period (int): - How many iterations to go back to calculate the improvement. - For example 5 would mean that each criterion evaluation is compared to the - criterion value from 5 iterations before. - -""" - -""" -===================================================================================== -2. Other Common Tuning Parameters for Optimization Algorithms -===================================================================================== -""" MAX_LINE_SEARCH_STEPS = 20 """int: Inspired by scipy L-BFGS-B.""" @@ -173,13 +116,6 @@ LIMITED_MEMORY_STORAGE_LENGTH = 10 """int: Taken from scipy L-BFGS-B.""" -THRESHOLD_FOR_SAFETY_STEP = 0.5 -r"""float: Threshold for when to call the safety step (:math:`\gamma_s`). - - :math:`\text{proposed step} \leq \text{threshold_for_safety_step} \cdot - \text{current_lower_trustregion_radius}`. 
- -""" CONSTRAINTS_ABSOLUTE_TOLERANCE = 1e-5 """float: Allowed tolerance of the equality and inequality constraints for values to be @@ -187,272 +123,6 @@ """ -""" -------------------------- -Trust Region Parameters -------------------------- -""" - -TRUSTREGION_THRESHOLD_SUCCESSFUL = 0.1 -"""float: Share of the predicted improvement that has to be achieved for a trust - region iteration to count as successful. - -""" - -TRUSTREGION_THRESHOLD_VERY_SUCCESSFUL = 0.7 -"""float: Share of predicted improvement that has to be achieved for a trust region - iteration to count as very successful.``criterion_noisy`` - -""" - -TRUSTREGION_SHRINKING_FACTOR_NOT_SUCCESSFUL = None -"""float: Ratio by which to shrink the upper trust region radius when realized - improvement does not match the ``threshold_successful``. The default is 0.98 - if the criterion is noisy and 0.5 else. - -""" - -TRUSTREGION_EXPANSION_FACTOR_SUCCESSFUL = 2.0 -r"""float: Ratio by which to expand the upper trust region radius :math:`\Delta_k` - in very successful iterations (:math:`\gamma_{inc}` in the notation of the paper). - -""" - -TRUSTREGION_EXPANSION_FACTOR_VERY_SUCCESSFUL = 4.0 -r"""float: Ratio of the proposed step ($\|s_k\|$) by which to expand the upper trust - region radius (:math:`\Delta_k`) in very successful iterations - (:math:`\overline{\gamma}_{inc}` in the notation of the paper). - -""" - -TRUSTREGION_SHRINKING_FACTOR_LOWER_RADIUS = None -r"""float: Ratio by which to shrink the lower trust region radius (:math:`\rho_k`) - (:math:`\alpha_1` in the notation of the paper). Default is 0.9 if - the criterion is noisy and 0.1 else. - -""" - -TRUSTREGION_SHRINKING_FACTOR_UPPER_RADIUS = None -r"""float: Ratio of the current lower trust region (:math:`\rho_k`) by which to shrink - the upper trust region radius (:math:`\Delta_k`) when the lower one is shrunk - (:math:`\alpha_2` in the notation of the paper). 
Default is 0.95 if the - criterion is noisy and 0.5 else.""" - -""" ---------------------------------------------- -Numerical Algorithm Group Tuning Parameters ---------------------------------------------- -""" - -INITIAL_DIRECTIONS = "coordinate" -"""string: How to draw the initial directions. Possible values are "coordinate" for - coordinate directions (the default) or "random". - -""" - -RANDOM_DIRECTIONS_ORTHOGONAL = True -"""bool: Whether to make randomly drawn initial directions orthogonal.""" - - -INTERPOLATION_ROUNDING_ERROR = 0.1 -r"""float: Internally, all the NAG algorithms store interpolation points with respect - to a base point :math:`x_b`; that is, we store :math:`\{y_t-x_b\}`, - which reduces the risk of roundoff errors. We shift :math:`x_b` to :math:`x_k` when - :math:`\text{proposed step} \leq \text{interpolation_rounding_error} \cdot - \|x_k-x_b\|`. - -""" - -CLIP_CRITERION_IF_OVERFLOWING = True -"""bool: Whether to clip the criterion to avoid ``OverflowError``.""" - - -TRUSTREGION_PRECONDITION_INTERPOLATION = True -"""bool: whether to scale the interpolation linear system to improve conditioning.""" - - -RESET_OPTIONS = { - "use_resets": None, - "minimal_trustregion_radius_tolerance_scaling_at_reset": 1.0, - "reset_type": "soft", - "move_center_at_soft_reset": True, - "reuse_criterion_value_at_hard_reset": True, - "max_iterations_without_new_best_after_soft_reset": None, - "auto_detect": True, - "auto_detect_history": 30, - "auto_detect_min_jacobian_increase": 0.015, - "auto_detect_min_correlations": 0.1, - "points_to_replace_at_soft_reset": 3, - "max_consecutive_unsuccessful_resets": 10, - # just bobyqa - "max_unsuccessful_resets": None, - "trust_region_scaling_at_unsuccessful_reset": None, - # just dfols - "max_interpolation_points": None, - "n_extra_interpolation_points_per_soft_reset": 0, - "n_extra_interpolation_points_per_hard_reset": 0, - "n_additional_extra_points_to_replace_per_reset": 0, -} -r"""dict: Options for reseting the 
optimization. - - Possible entries are: - - use_resets (bool): Whether to do resets when the lower trust - region radius (:math:`\rho_k`) reaches the stopping criterion - (:math:`\rho_{end}`), or (optionally) when all interpolation points are - within noise level. Default is ``True`` if the criterion is noisy. - minimal_trustregion_radius_tolerance_scaling_at_reset (float): Factor with - which the trust region stopping criterion is multiplied at each reset. - - reset_type (str): Whether to use "soft" or "hard" resets. Default is "soft". - - move_center_at_soft_reset (bool): Whether to move the trust region center - ($x_k$) to the best new point evaluated in stead of keeping it constant. - points_to_replace_at_soft_reset (int): Number of interpolation points to move - at each soft reset. - reuse_criterion_value_at_hard_reset (bool): Whether or not to recycle the - criterion value at the best iterate found when performing a hard reset. - This saves one criterion evaluation. - max_iterations_without_new_best_after_soft_reset (int): - The maximum number of successful steps in a given run where the new - criterion value is worse than the best value found in previous runs before - terminating. Default is ``max_criterion_evaluations``. - auto_detect (bool): Whether or not to - automatically determine when to reset. This is an additional condition - and resets can still be triggered by small upper trust region radius, etc. - There are two criteria used: upper trust region radius shrinkage - (no increases over the history, more decreases than no changes) and - changes in the model Jacobian (consistently increasing trend as measured - by slope and correlation coefficient of the line of best fit). - auto_detect_history (int): - How many iterations of model changes and trust region radii to store. - auto_detect_min_jacobian_increase (float): - Minimum rate of increase of the Jacobian over past iterations to cause a - reset. 
- auto_detect_min_correlations (float): - Minimum correlation of the Jacobian data set required to cause a reset. - max_consecutive_unsuccessful_resets (int): maximum number of consecutive - unsuccessful resets allowed (i.e. resets which did not outperform the - best known value from earlier runs). - - Only used when using nag_bobyqa: - - max_unsuccessful_resets (int): - number of total unsuccessful resets allowed. - Default is 20 if ``seek_global_optimum`` and else unrestricted. - trust_region_scaling_at_unsuccessful_reset (float): Factor by which to - expand the initial lower trust region radius (:math:`\rho_{beg}`) after - unsuccessful resets. Default is 1.1 if ``seek_global_optimum`` else 1. - - Only used when using nag_dfols: - - max_interpolation_points (int): Maximum allowed value of the number of - interpolation points. This is useful if the number of interpolation points - increases with each reset, e.g. when - ``n_extra_interpolation_points_per_soft_reset > 0``. The default is - ``n_interpolation_points``. - n_extra_interpolation_points_per_soft_reset (int): Number of points to add to - the interpolation set with each soft reset. - n_extra_interpolation_points_per_hard_reset (int): Number of points to add to - the interpolation set with each hard reset. - n_additional_extra_points_to_replace_per_reset (int): This parameter modifies - ``n_extra_points_to_replace_successful``. With each reset - ``n_extra_points_to_replace_successful`` is increased by this number. - -""" - - -TRUSTREGION_FAST_START_OPTIONS = { - "min_inital_points": None, - "method": "auto", - "scale_of_trustregion_step_perturbation": None, - "scale_of_jacobian_components_perturbation": 1e-2, - # the following will be growing.full_rank.min_sing_val - # but it not supported yet by DF-OLS. 
- "floor_of_jacobian_singular_values": 1, - "jacobian_max_condition_number": 1e8, - "geometry_improving_steps": False, - "safety_steps": True, - "shrink_upper_radius_in_safety_steps": False, - "full_geometry_improving_step": False, - "reset_trustregion_radius_after_fast_start": False, - "reset_min_trustregion_radius_after_fast_start": False, - "shrinking_factor_not_successful": None, - "n_extra_search_directions_per_iteration": 0, -} -r"""dict: Options to start the optimization while building the full trust region model. - - To activate this, set the number of interpolation points at which to evaluate the - criterion before doing the first step, `min_initial_points`, to something smaller - than the number of parameters. - - The following options can be specified: - - min_initial_points (int): Number of initial interpolation - points in addition to the start point. This should only be changed to - a value less than ``len(x)``, and only if the default setup cost - of ``len(x) + 1`` evaluations of the criterion is impractical. - If this is set to be less than the default, the input value of - ``n_interpolation_points`` should be set to ``len(x)``. - If the default is used, all the other parameters have no effect. - Default is ``n_interpolation_points - 1``. - If the default setup costs of the evaluations are very large, DF-OLS - can start with less than ``len(x)`` interpolation points and add points - to the trust region model with every iteration. - method ("jacobian", "trustregion" or "auto"): - When there are less interpolation points than ``len(x)`` the model is - underdetermined. This can be fixed in two ways: - If "jacobian", the interpolated Jacobian is perturbed to have full - rank, allowing the trust region step to include components in the full - search space. This is the default if - ``len(x) \geq number of root contributions``. - If "trustregion_step", the trust region step is perturbed by an - orthogonal direction not yet searched. 
It is the default if - ``len(x) < number of root contributions``. - scale_of_trustregion_step_perturbation (float): - When adding new search directions, the length of the step is the trust - region radius multiplied by this value. The default is 0.1 if - ``method == "trustregion"`` else 1. - scale_of_jacobian_components_perturbation (float): Magnitude of extra - components added to the Jacobian. Default is 1e-2. - floor_of_jacobian_singular_values (float): Floor singular - values of the Jacobian at this factor of the last non zero value. - As of version 1.2.1 this option is not yet supported by DF-OLS! - scale_of_jacobian_singular_value_floor (float): - Floor singular values of the Jacobian at this factor of the last nonzero - value. - jacobian_max_condition_number (float): Cap on the condition number - of Jacobian after applying floors to singular values - (effectively another floor on the smallest singular value, since the - largest singular value is fixed). - geometry_improving_steps (bool): Whether to do geometry-improving steps in the - trust region algorithm, as per the usual algorithm during the fast start. - safety_steps (bool): - Whether to perform safety steps. - shrink_upper_radius_in_safety_steps (bool): During the fast start whether to - shrink the upper trust region radius in safety steps. - full_geometry_improving_step (bool): During the fast start whether to do a - full geometry-improving step within safety steps (the same as the post fast - start phase of the algorithm). Since this involves reducing the upper trust - region radius, this can only be `True` if - `shrink_upper_radius_in_safety_steps == False`. - reset_trustregion_radius_after_fast_start (bool): - Whether or not to reset the upper trust region radius to its initial value - at the end of the fast start phase. 
- reset_min_trustregion_radius_after_fast_start (bool): - Whether or not to reset the minimum trust region radius - (:math:`\rho_k`) to its initial value at the end of the fast start phase. - shrinking_factor_not_successful (float): - Ratio by which to shrink the trust region radius when realized - improvement does not match the ``threshold_for_successful_iteration`` - during the fast start phase. By default it is the same as - ``reduction_when_not_successful``. - n_extra_search_directions_per_iteration (int): Number of new search - directions to add with each iteration where we do not have a full set - of search directions. This approach is not recommended! Default is 0. - -""" - def get_population_size(population_size, x, lower_bound=10): """Default population size for genetic algorithms.""" diff --git a/src/optimagic/optimizers/nag_optimizers.py b/src/optimagic/optimizers/nag_optimizers.py index 6dc35c6bf..9c1dab381 100644 --- a/src/optimagic/optimizers/nag_optimizers.py +++ b/src/optimagic/optimizers/nag_optimizers.py @@ -15,27 +15,8 @@ from optimagic.config import IS_DFOLS_INSTALLED, IS_PYBOBYQA_INSTALLED from optimagic.decorators import mark_minimizer from optimagic.exceptions import NotInstalledError -from optimagic.optimization.algo_options import ( - CLIP_CRITERION_IF_OVERFLOWING, - CONVERGENCE_MINIMAL_TRUSTREGION_RADIUS_TOLERANCE, - CONVERGENCE_NOISE_CORRECTED_FTOL, - CONVERGENCE_SLOW_PROGRESS, - INITIAL_DIRECTIONS, - INTERPOLATION_ROUNDING_ERROR, - RANDOM_DIRECTIONS_ORTHOGONAL, - RESET_OPTIONS, - STOPPING_MAXFUN, - THRESHOLD_FOR_SAFETY_STEP, - TRUSTREGION_EXPANSION_FACTOR_SUCCESSFUL, - TRUSTREGION_EXPANSION_FACTOR_VERY_SUCCESSFUL, - TRUSTREGION_FAST_START_OPTIONS, - TRUSTREGION_PRECONDITION_INTERPOLATION, - TRUSTREGION_SHRINKING_FACTOR_LOWER_RADIUS, - TRUSTREGION_SHRINKING_FACTOR_NOT_SUCCESSFUL, - TRUSTREGION_SHRINKING_FACTOR_UPPER_RADIUS, - TRUSTREGION_THRESHOLD_SUCCESSFUL, - TRUSTREGION_THRESHOLD_VERY_SUCCESSFUL, -) +from 
optimagic.optimization.algo_options import STOPPING_MAXFUN + from optimagic.utilities import calculate_trustregion_initial_radius if IS_PYBOBYQA_INSTALLED: @@ -45,6 +26,310 @@ import dfols +CONVERGENCE_MINIMAL_TRUSTREGION_RADIUS_TOLERANCE = 1e-8 +"""float: Stop when the lower trust region radius falls below this value.""" + +CONVERGENCE_SLOW_PROGRESS = { + "threshold_to_characterize_as_slow": 1e-8, + "max_insufficient_improvements": None, + "comparison_period": 5, +} +"""dict: Specification of when to terminate or reset the optimization because of only + slow improvements. This is similar to an absolute criterion tolerance only that + instead of a single improvement the average over several iterations must be small. + + Possible entries are: + threshold_to_characterize_as_slow (float): Threshold whether an improvement + is insufficient. Note: the improvement is divided by the + ``comparison_period``. + So this is the required average improvement per iteration over the + comparison period. + max_insufficient_improvements (int): Number of consecutive + insufficient improvements before termination (or reset). Default is + ``20 * len(x)``. + comparison_period (int): + How many iterations to go back to calculate the improvement. + For example 5 would mean that each criterion evaluation is compared to the + criterion value from 5 iterations before. + +""" + +THRESHOLD_FOR_SAFETY_STEP = 0.5 +r"""float: Threshold for when to call the safety step (:math:`\gamma_s`). + + :math:`\text{proposed step} \leq \text{threshold_for_safety_step} \cdot + \text{current_lower_trustregion_radius}`. + +""" + +CONVERGENCE_NOISE_CORRECTED_FTOL = 1.0 +"""float: Stop when the evaluations on the set of interpolation points all fall within + this factor of the noise level. The default is 1, i.e. when all evaluations are + within the noise level. If you want to not use this criterion but still flag your + criterion function as noisy, set this tolerance to 0.0. + + .. 
warning:: + Very small values, as in most other tolerances don't make sense here. + +""" + + +TRUSTREGION_THRESHOLD_SUCCESSFUL = 0.1 +"""float: Share of the predicted improvement that has to be achieved for a trust + region iteration to count as successful. + +""" + +TRUSTREGION_THRESHOLD_VERY_SUCCESSFUL = 0.7 +"""float: Share of predicted improvement that has to be achieved for a trust region + iteration to count as very successful.``criterion_noisy`` + +""" + +TRUSTREGION_SHRINKING_FACTOR_NOT_SUCCESSFUL = None +"""float: Ratio by which to shrink the upper trust region radius when realized + improvement does not match the ``threshold_successful``. The default is 0.98 + if the criterion is noisy and 0.5 else. + +""" + +TRUSTREGION_EXPANSION_FACTOR_SUCCESSFUL = 2.0 +r"""float: Ratio by which to expand the upper trust region radius :math:`\Delta_k` + in very successful iterations (:math:`\gamma_{inc}` in the notation of the paper). + +""" + +TRUSTREGION_EXPANSION_FACTOR_VERY_SUCCESSFUL = 4.0 +r"""float: Ratio of the proposed step ($\|s_k\|$) by which to expand the upper trust + region radius (:math:`\Delta_k`) in very successful iterations + (:math:`\overline{\gamma}_{inc}` in the notation of the paper). + +""" + +TRUSTREGION_SHRINKING_FACTOR_LOWER_RADIUS = None +r"""float: Ratio by which to shrink the lower trust region radius (:math:`\rho_k`) + (:math:`\alpha_1` in the notation of the paper). Default is 0.9 if + the criterion is noisy and 0.1 else. + +""" + +TRUSTREGION_SHRINKING_FACTOR_UPPER_RADIUS = None +r"""float: Ratio of the current lower trust region (:math:`\rho_k`) by which to shrink + the upper trust region radius (:math:`\Delta_k`) when the lower one is shrunk + (:math:`\alpha_2` in the notation of the paper). Default is 0.95 if the + criterion is noisy and 0.5 else.""" + + +INITIAL_DIRECTIONS = "coordinate" +"""string: How to draw the initial directions. Possible values are "coordinate" for + coordinate directions (the default) or "random". 
+ +""" + +RANDOM_DIRECTIONS_ORTHOGONAL = True +"""bool: Whether to make randomly drawn initial directions orthogonal.""" + + +INTERPOLATION_ROUNDING_ERROR = 0.1 +r"""float: Internally, all the NAG algorithms store interpolation points with respect + to a base point :math:`x_b`; that is, we store :math:`\{y_t-x_b\}`, + which reduces the risk of roundoff errors. We shift :math:`x_b` to :math:`x_k` when + :math:`\text{proposed step} \leq \text{interpolation_rounding_error} \cdot + \|x_k-x_b\|`. + +""" + +CLIP_CRITERION_IF_OVERFLOWING = True +"""bool: Whether to clip the criterion to avoid ``OverflowError``.""" + + +TRUSTREGION_PRECONDITION_INTERPOLATION = True +"""bool: whether to scale the interpolation linear system to improve conditioning.""" + + +RESET_OPTIONS = { + "use_resets": None, + "minimal_trustregion_radius_tolerance_scaling_at_reset": 1.0, + "reset_type": "soft", + "move_center_at_soft_reset": True, + "reuse_criterion_value_at_hard_reset": True, + "max_iterations_without_new_best_after_soft_reset": None, + "auto_detect": True, + "auto_detect_history": 30, + "auto_detect_min_jacobian_increase": 0.015, + "auto_detect_min_correlations": 0.1, + "points_to_replace_at_soft_reset": 3, + "max_consecutive_unsuccessful_resets": 10, + # just bobyqa + "max_unsuccessful_resets": None, + "trust_region_scaling_at_unsuccessful_reset": None, + # just dfols + "max_interpolation_points": None, + "n_extra_interpolation_points_per_soft_reset": 0, + "n_extra_interpolation_points_per_hard_reset": 0, + "n_additional_extra_points_to_replace_per_reset": 0, +} +r"""dict: Options for resetting the optimization. + + Possible entries are: + + use_resets (bool): Whether to do resets when the lower trust + region radius (:math:`\rho_k`) reaches the stopping criterion + (:math:`\rho_{end}`), or (optionally) when all interpolation points are + within noise level. Default is ``True`` if the criterion is noisy.
+ minimal_trustregion_radius_tolerance_scaling_at_reset (float): Factor with + which the trust region stopping criterion is multiplied at each reset. + + reset_type (str): Whether to use "soft" or "hard" resets. Default is "soft". + + move_center_at_soft_reset (bool): Whether to move the trust region center + ($x_k$) to the best new point evaluated instead of keeping it constant. + points_to_replace_at_soft_reset (int): Number of interpolation points to move + at each soft reset. + reuse_criterion_value_at_hard_reset (bool): Whether or not to recycle the + criterion value at the best iterate found when performing a hard reset. + This saves one criterion evaluation. + max_iterations_without_new_best_after_soft_reset (int): + The maximum number of successful steps in a given run where the new + criterion value is worse than the best value found in previous runs before + terminating. Default is ``max_criterion_evaluations``. + auto_detect (bool): Whether or not to + automatically determine when to reset. This is an additional condition + and resets can still be triggered by small upper trust region radius, etc. + There are two criteria used: upper trust region radius shrinkage + (no increases over the history, more decreases than no changes) and + changes in the model Jacobian (consistently increasing trend as measured + by slope and correlation coefficient of the line of best fit). + auto_detect_history (int): + How many iterations of model changes and trust region radii to store. + auto_detect_min_jacobian_increase (float): + Minimum rate of increase of the Jacobian over past iterations to cause a + reset. + auto_detect_min_correlations (float): + Minimum correlation of the Jacobian data set required to cause a reset. + max_consecutive_unsuccessful_resets (int): maximum number of consecutive + unsuccessful resets allowed (i.e. resets which did not outperform the + best known value from earlier runs).
+ + Only used when using nag_bobyqa: + + max_unsuccessful_resets (int): + number of total unsuccessful resets allowed. + Default is 20 if ``seek_global_optimum`` and else unrestricted. + trust_region_scaling_at_unsuccessful_reset (float): Factor by which to + expand the initial lower trust region radius (:math:`\rho_{beg}`) after + unsuccessful resets. Default is 1.1 if ``seek_global_optimum`` else 1. + + Only used when using nag_dfols: + + max_interpolation_points (int): Maximum allowed value of the number of + interpolation points. This is useful if the number of interpolation points + increases with each reset, e.g. when + ``n_extra_interpolation_points_per_soft_reset > 0``. The default is + ``n_interpolation_points``. + n_extra_interpolation_points_per_soft_reset (int): Number of points to add to + the interpolation set with each soft reset. + n_extra_interpolation_points_per_hard_reset (int): Number of points to add to + the interpolation set with each hard reset. + n_additional_extra_points_to_replace_per_reset (int): This parameter modifies + ``n_extra_points_to_replace_successful``. With each reset + ``n_extra_points_to_replace_successful`` is increased by this number. + +""" + + +TRUSTREGION_FAST_START_OPTIONS = { + "min_inital_points": None, + "method": "auto", + "scale_of_trustregion_step_perturbation": None, + "scale_of_jacobian_components_perturbation": 1e-2, + # the following will be growing.full_rank.min_sing_val + # but it not supported yet by DF-OLS. 
+ "floor_of_jacobian_singular_values": 1, + "jacobian_max_condition_number": 1e8, + "geometry_improving_steps": False, + "safety_steps": True, + "shrink_upper_radius_in_safety_steps": False, + "full_geometry_improving_step": False, + "reset_trustregion_radius_after_fast_start": False, + "reset_min_trustregion_radius_after_fast_start": False, + "shrinking_factor_not_successful": None, + "n_extra_search_directions_per_iteration": 0, +} +r"""dict: Options to start the optimization while building the full trust region model. + + To activate this, set the number of interpolation points at which to evaluate the + criterion before doing the first step, `min_initial_points`, to something smaller + than the number of parameters. + + The following options can be specified: + + min_initial_points (int): Number of initial interpolation + points in addition to the start point. This should only be changed to + a value less than ``len(x)``, and only if the default setup cost + of ``len(x) + 1`` evaluations of the criterion is impractical. + If this is set to be less than the default, the input value of + ``n_interpolation_points`` should be set to ``len(x)``. + If the default is used, all the other parameters have no effect. + Default is ``n_interpolation_points - 1``. + If the default setup costs of the evaluations are very large, DF-OLS + can start with less than ``len(x)`` interpolation points and add points + to the trust region model with every iteration. + method ("jacobian", "trustregion" or "auto"): + When there are less interpolation points than ``len(x)`` the model is + underdetermined. This can be fixed in two ways: + If "jacobian", the interpolated Jacobian is perturbed to have full + rank, allowing the trust region step to include components in the full + search space. This is the default if + ``len(x) \geq number of root contributions``. + If "trustregion_step", the trust region step is perturbed by an + orthogonal direction not yet searched. 
It is the default if + ``len(x) < number of root contributions``. + scale_of_trustregion_step_perturbation (float): + When adding new search directions, the length of the step is the trust + region radius multiplied by this value. The default is 0.1 if + ``method == "trustregion"`` else 1. + scale_of_jacobian_components_perturbation (float): Magnitude of extra + components added to the Jacobian. Default is 1e-2. + floor_of_jacobian_singular_values (float): Floor singular + values of the Jacobian at this factor of the last non zero value. + As of version 1.2.1 this option is not yet supported by DF-OLS! + scale_of_jacobian_singular_value_floor (float): + Floor singular values of the Jacobian at this factor of the last nonzero + value. + jacobian_max_condition_number (float): Cap on the condition number + of Jacobian after applying floors to singular values + (effectively another floor on the smallest singular value, since the + largest singular value is fixed). + geometry_improving_steps (bool): Whether to do geometry-improving steps in the + trust region algorithm, as per the usual algorithm during the fast start. + safety_steps (bool): + Whether to perform safety steps. + shrink_upper_radius_in_safety_steps (bool): During the fast start whether to + shrink the upper trust region radius in safety steps. + full_geometry_improving_step (bool): During the fast start whether to do a + full geometry-improving step within safety steps (the same as the post fast + start phase of the algorithm). Since this involves reducing the upper trust + region radius, this can only be `True` if + `shrink_upper_radius_in_safety_steps == False`. + reset_trustregion_radius_after_fast_start (bool): + Whether or not to reset the upper trust region radius to its initial value + at the end of the fast start phase. 
+ reset_min_trustregion_radius_after_fast_start (bool): + Whether or not to reset the minimum trust region radius + (:math:`\rho_k`) to its initial value at the end of the fast start phase. + shrinking_factor_not_successful (float): + Ratio by which to shrink the trust region radius when realized + improvement does not match the ``threshold_for_successful_iteration`` + during the fast start phase. By default it is the same as + ``reduction_when_not_successful``. + n_extra_search_directions_per_iteration (int): Number of new search + directions to add with each iteration where we do not have a full set + of search directions. This approach is not recommended! Default is 0. + +""" + + @mark_minimizer( name="nag_dfols", primary_criterion_entry="root_contributions", From 6d366a7342580a1d5bfebf95fd79563f64c2e133 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Thu, 18 Jul 2024 19:16:45 +0200 Subject: [PATCH 17/25] Cleanup. --- docs/source/how_to/how_to_specify_algorithm_and_algo_options.md | 1 - 1 file changed, 1 deletion(-) diff --git a/docs/source/how_to/how_to_specify_algorithm_and_algo_options.md b/docs/source/how_to/how_to_specify_algorithm_and_algo_options.md index 4472c1f52..3e9550bb5 100644 --- a/docs/source/how_to/how_to_specify_algorithm_and_algo_options.md +++ b/docs/source/how_to/how_to_specify_algorithm_and_algo_options.md @@ -35,7 +35,6 @@ algo_options = { "trustregion.shrinking_factor.not_successful": 0.4, "trustregion.shrinking_factor.lower_radius": 0.2, "trustregion.shrinking_factor.upper_radius": 0.8, - "convergence.scaled_criterion_tolerance": 0.0, "convergence.noise_corrected_criterion_tolerance": 1.1, } ``` From 18adaf33f7ae25ade7e2f1f12f33697f81430aeb Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 10:22:56 +0200 Subject: [PATCH 18/25] Support jac=True and add more tests. 
--- CHANGES.md | 35 ++++++++++++++++++- src/optimagic/optimization/optimize.py | 14 +++++++- src/optimagic/optimization/scipy_aliases.py | 23 ++++++++++++ .../optimization/test_scipy_aliases.py | 20 +++++++++++ tests/test_deprecations.py | 28 +++++++++++++++ 5 files changed, 118 insertions(+), 2 deletions(-) diff --git a/CHANGES.md b/CHANGES.md index 51683d4cb..d2fab99e8 100644 --- a/CHANGES.md +++ b/CHANGES.md @@ -18,10 +18,43 @@ the major changes are: - Rename the package from `estimagic` to `optimagic` (while keeping the `estimagic` namespace for the estimation capabilities). -### Breaking changes - {gh}`500` removes the dashboard, the support for simopt optimizers and the `derivative_plot` ({ghuser}`janosg`) +- {gh}`504` aligns `maximize` and `minimize` more closely with scipy. All related + deprecations and breaking changes are listed below. As a result, scipy code that uses + minimize with the arguments `x0`, `fun`, `jac` and `method` will run without changes + in optimagic. Similarly, `OptimizeResult` gets some aliases so it behaves more + like SciPy's. + +### Breaking changes + + +### Deprecations + +- The `criterion` argument of `maximize` and `minimize` is renamed to `fun` (as in + SciPy). +- The `derivative` argument of `maximize` and `minimize` is renamed to `jac` (as + in SciPy). +- The `criterion_and_derivative` argument of `maximize` and `minimize` is renamed + to `fun_and_jac` to align it with the other names. +- The `criterion_kwargs` argument of `maximize` and `minimize` is renamed to + `fun_kwargs` to align it with the other names. +- The `derivative_kwargs` argument of `maximize` and `minimize` is renamed to + `jac_kwargs` to align it with the other names. +- The `criterion_and_derivative_kwargs` argument of `maximize` and `minimize` is + renamed to `fun_and_jac_kwargs` to align it with the other names. +- Algorithm specific convergence and stopping criteria are renamed to align them more + with NlOpt and SciPy names.
+ - `convergence_relative_criterion_tolerance` -> `convergence_ftol_rel` + - `convergence_absolute_criterion_tolerance` -> `convergence_ftol_abs` + - `convergence_relative_params_tolerance` -> `convergence_xtol_rel` + - `convergence_absolute_params_tolerance` -> `convergence_xtol_abs` + - `convergence_relative_gradient_tolerance` -> `convergence_gtol_rel` + - `convergence_absolute_gradient_tolerance` -> `convergence_gtol_abs` + - `convergence_scaled_gradient_tolerance` -> `convergence_gtol_scaled` + - `stopping_max_criterion_evaluations` -> `stopping_maxfun` + - `stopping_max_iterations` -> `stopping_maxiter` ## 0.4.7 diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index 4c9074d53..348b85d9f 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -38,7 +38,10 @@ process_func_of_params, get_kwargs_from_args, ) -from optimagic.optimization.scipy_aliases import map_method_to_algorithm +from optimagic.optimization.scipy_aliases import ( + map_method_to_algorithm, + split_fun_and_jac, +) from optimagic import deprecations from optimagic.deprecations import replace_and_warn_about_deprecated_algo_options @@ -390,6 +393,15 @@ def _optimize( kwargs = get_kwargs_from_args(args, fun, offset=1) fun_kwargs, jac_kwargs, fun_and_jac_kwargs = kwargs, kwargs, kwargs + # jac is not an alias but we need to handle the case where `jac=True`, i.e. fun is + # actually fun_and_jac. This is not recommended in optimagic because then optimizers + # cannot evaluate fun in isolation but we can easily support it for compatibility. 
+ if jac is True: + jac = None + if fun_and_jac is None: + fun_and_jac = fun + fun = split_fun_and_jac(fun_and_jac, target="fun") + # ================================================================================== # Handle scipy arguments that are not yet implemented # ================================================================================== diff --git a/src/optimagic/optimization/scipy_aliases.py b/src/optimagic/optimization/scipy_aliases.py index 434e6f5e6..4473ebec8 100644 --- a/src/optimagic/optimization/scipy_aliases.py +++ b/src/optimagic/optimization/scipy_aliases.py @@ -1,4 +1,6 @@ from optimagic.utilities import propose_alternatives +import functools +from optimagic.exceptions import InvalidFunctionError def map_method_to_algorithm(method): @@ -41,3 +43,24 @@ def map_method_to_algorithm(method): ) raise ValueError(msg) return algo + + +def split_fun_and_jac(fun_and_jac, target="fun"): + + index = 0 if target == "fun" else 1 + + @functools.wraps(fun_and_jac) + def fun(*args, **kwargs): + raw = fun_and_jac(*args, **kwargs) + try: + out = raw[index] + except TypeError as e: + msg = ( + "If you set `jac=True`, `fun` needs to return a tuple where the first " + "entry is the value of your objective function and the second entry " + "is its derivative." 
+ ) + raise InvalidFunctionError(msg) from e + return out + + return fun diff --git a/tests/optimagic/optimization/test_scipy_aliases.py b/tests/optimagic/optimization/test_scipy_aliases.py index 022e7907f..e0cfbb730 100644 --- a/tests/optimagic/optimization/test_scipy_aliases.py +++ b/tests/optimagic/optimization/test_scipy_aliases.py @@ -181,3 +181,23 @@ def test_args_does_not_work_with_together_with_any_kwargs(): args=(1,), fun_kwargs={"a": 1}, ) + + +def test_jac_equal_true_works_in_minimize(): + res = om.minimize( + fun=lambda x: (x @ x, 2 * x), + params=np.arange(3), + algorithm="scipy_lbfgsb", + jac=True, + ) + aaae(res.params, np.zeros(3)) + + +def test_jac_equal_true_works_in_maximize(): + res = om.maximize( + fun=lambda x: (-x @ x, -2 * x), + params=np.arange(3), + algorithm="scipy_lbfgsb", + jac=True, + ) + aaae(res.params, np.zeros(3)) diff --git a/tests/test_deprecations.py b/tests/test_deprecations.py index 6a2998126..321753152 100644 --- a/tests/test_deprecations.py +++ b/tests/test_deprecations.py @@ -25,6 +25,7 @@ from estimagic import OptimizeLogReader, OptimizeResult from estimagic import criterion_plot, params_plot import optimagic as om +import warnings # ====================================================================================== # Deprecated in 0.5.0, remove in 0.6.0 @@ -342,3 +343,30 @@ def test_criterion_and_derivative_kwargs_is_deprecated(): fun_and_jac=lambda x, a: (x @ x, 2 * x), criterion_and_derivative_kwargs={"a": 1}, ) + + +ALGO_OPTIONS = [ + {"convergence_absolute_criterion_tolerance": 1e-8}, + {"convergence_relative_criterion_tolerance": 1e-8}, + {"convergence_absolute_params_tolerance": 1e-8}, + {"convergence_relative_params_tolerance": 1e-8}, + {"convergence_absolute_gradient_tolerance": 1e-8}, + {"convergence_relative_gradient_tolerance": 1e-8}, + {"convergence_scaled_gradient_tolerance": 1e-8}, + {"stopping_max_iterations": 1_000}, + {"stopping_max_criterion_evaluations": 1_000}, +] + + 
+@pytest.mark.parametrize("algo_option", ALGO_OPTIONS) +def test_old_convergence_criteria_are_deprecated(algo_option): + msg = "The following keys in `algo_options` are deprecated" + with warnings.catch_warnings(): + warnings.simplefilter("ignore", category=UserWarning) + with pytest.warns(FutureWarning, match=msg): + om.minimize( + lambda x: x @ x, + params=np.arange(3), + algorithm="scipy_lbfgsb", + algo_options=algo_option, + ) From 3e625a48f8c1334db4db8d3829788b5707f32c81 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 11:13:36 +0200 Subject: [PATCH 19/25] Rename some attributes of OptimizeResult. --- .../source/explanation/internal_optimizers.md | 4 +- src/optimagic/optimization/optimize.py | 2 +- src/optimagic/optimization/optimize_result.py | 56 +++++++++++++++---- src/optimagic/optimization/process_results.py | 20 +++---- src/optimagic/optimizers/nlopt_optimizers.py | 4 +- src/optimagic/optimizers/pygmo_optimizers.py | 4 +- src/optimagic/optimizers/scipy_optimizers.py | 4 +- src/optimagic/optimizers/tao_optimizers.py | 4 +- .../optimization/test_history_collection.py | 2 +- .../optimagic/optimization/test_multistart.py | 2 +- tests/optimagic/optimization/test_optimize.py | 2 +- .../optimization/test_optimize_result.py | 8 +-- tests/test_deprecations.py | 22 +++++++- 13 files changed, 93 insertions(+), 41 deletions(-) diff --git a/docs/source/explanation/internal_optimizers.md b/docs/source/explanation/internal_optimizers.md index a99b56348..3ee33f806 100644 --- a/docs/source/explanation/internal_optimizers.md +++ b/docs/source/explanation/internal_optimizers.md @@ -56,8 +56,8 @@ should return a dictionary with the following entries: - solution_x: The best parameter achieved so far - solution_criterion: The value of the criterion at solution_x. This can be a scalar or dictionary. -- n_criterion_evaluations: The number of criterion evaluations. -- n_derivative_evaluations: The number of derivative evaluations. 
+- n_fun_evals: The number of criterion evaluations. +- n_jac_evals: The number of derivative evaluations. - n_iterations: The number of iterations - success: True if convergence was achieved - message: A string with additional information. diff --git a/src/optimagic/optimization/optimize.py b/src/optimagic/optimization/optimize.py index 348b85d9f..9140984f3 100644 --- a/src/optimagic/optimization/optimize.py +++ b/src/optimagic/optimization/optimize.py @@ -761,7 +761,7 @@ def _optimize( ) fixed_result_kwargs = { - "start_criterion": _scalar_start_criterion, + "start_fun": _scalar_start_criterion, "start_params": params, "algorithm": algo_info.name, "direction": direction, diff --git a/src/optimagic/optimization/optimize_result.py b/src/optimagic/optimization/optimize_result.py index 3f9a4a0fc..334728246 100644 --- a/src/optimagic/optimization/optimize_result.py +++ b/src/optimagic/optimization/optimize_result.py @@ -6,6 +6,7 @@ from optimagic.utilities import to_pickle from optimagic.shared.compat import pd_df_map +import warnings @dataclass @@ -16,8 +17,8 @@ class OptimizeResult: Attributes: params (Any): The optimal parameters. - criterion (float): The optimal criterion value. - start_criterion (float): The criterion value at the start parameters. + fun (float): The optimal criterion value. + start_fun (float): The criterion value at the start parameters. start_params (Any): The start parameters. algorithm (str): The algorithm used for the optimization. direction (str): Maximize or minimize. 
@@ -38,8 +39,8 @@ class OptimizeResult: """ params: Any - criterion: float - start_criterion: float + fun: float + start_fun: float start_params: Any algorithm: str direction: str @@ -47,8 +48,8 @@ class OptimizeResult: message: Union[str, None] = None success: Union[bool, None] = None - n_criterion_evaluations: Union[int, None] = None - n_derivative_evaluations: Union[int, None] = None + n_fun_evals: Union[int, None] = None + n_jac_evals: Union[int, None] = None n_iterations: Union[int, None] = None history: Union[Dict, None] = None @@ -58,6 +59,39 @@ class OptimizeResult: multistart_info: Union[Dict, None] = None algorithm_output: Dict = field(default_factory=dict) + @property + def criterion(self): + msg = "The criterion attribute is deprecated. Use the fun attribute instead." + warnings.warn(msg, FutureWarning) + return self.fun + + @property + def start_criterion(self): + msg = ( + "The start_criterion attribute is deprecated. Use the start_fun attribute " + "instead." + ) + warnings.warn(msg, FutureWarning) + return self.start_fun + + @property + def n_criterion_evaluations(self): + msg = ( + "The n_criterion_evaluations attribute is deprecated. Use the n_fun_evals " + "attribute instead." + ) + warnings.warn(msg, FutureWarning) + return self.n_fun_evals + + @property + def n_derivative_evaluations(self): + msg = ( + "The n_derivative_evaluations attribute is deprecated. Use the n_jac_evals " + "attribute instead." 
+ ) + warnings.warn(msg, FutureWarning) + return self.n_jac_evals + def __repr__(self): first_line = ( f"{self.direction.title()} with {self.n_free} free parameters terminated" @@ -68,8 +102,8 @@ def __repr__(self): first_line += f" {snippet}" counters = [ - ("criterion evaluations", self.n_criterion_evaluations), - ("derivative evaluations", self.n_derivative_evaluations), + ("criterion evaluations", self.n_fun_evals), + ("derivative evaluations", self.n_jac_evals), ("iterations", self.n_iterations), ] @@ -93,10 +127,10 @@ def __repr__(self): else: message = None - if self.start_criterion is not None and self.criterion is not None: + if self.start_fun is not None and self.fun is not None: improvement = ( - f"The value of criterion improved from {self.start_criterion} to " - f"{self.criterion}." + f"The value of criterion improved from {self.start_fun} to " + f"{self.fun}." ) else: improvement = None diff --git a/src/optimagic/optimization/process_results.py b/src/optimagic/optimization/process_results.py index 7c02a6053..cdea70133 100644 --- a/src/optimagic/optimization/process_results.py +++ b/src/optimagic/optimization/process_results.py @@ -37,7 +37,7 @@ def process_internal_optimizer_result( skip_checks=skip_checks, ) - crit_hist = [opt.criterion for opt in info["local_optima"]] + crit_hist = [opt.fun for opt in info["local_optima"]] params_hist = [opt.params for opt in info["local_optima"]] time_hist = [np.nan for opt in info["local_optima"]] hist = {"criterion": crit_hist, "params": params_hist, "runtime": time_hist} @@ -54,11 +54,11 @@ def process_internal_optimizer_result( [opt.n_iterations for opt in info["local_optima"]] ) - res.n_criterion_evaluations = _sum_or_none( - [opt.n_criterion_evaluations for opt in info["local_optima"]] + res.n_fun_evals = _sum_or_none( + [opt.n_fun_evals for opt in info["local_optima"]] ) - res.n_derivative_evaluations = _sum_or_none( - [opt.n_derivative_evaluations for opt in info["local_optima"]] + res.n_jac_evals = 
_sum_or_none( + [opt.n_jac_evals for opt in info["local_optima"]] ) res.multistart_info = info @@ -78,8 +78,8 @@ def _process_one_result(res, converter, primary_key, fixed_kwargs, skip_checks): _criterion = -_criterion optional_entries = [ - "n_criterion_evaluations", - "n_derivative_evaluations", + "n_fun_evals", + "n_jac_evals", "n_iterations", "success", "message", @@ -107,7 +107,7 @@ def _process_one_result(res, converter, primary_key, fixed_kwargs, skip_checks): out = OptimizeResult( params=_params, - criterion=_criterion, + fun=_criterion, **fixed_kwargs, **optional_kwargs, algorithm_output=algo_output, @@ -126,7 +126,7 @@ def _process_multistart_info(info, converter, primary_key, fixed_kwargs, skip_ch for res, start in zip(info["local_optima"], starts): kwargs = fixed_kwargs.copy() kwargs["start_params"] = start - kwargs["start_criterion"] = None + kwargs["start_fun"] = None processed = _process_one_result( res, converter=converter, @@ -155,7 +155,7 @@ def _process_multistart_info(info, converter, primary_key, fixed_kwargs, skip_ch def _dummy_result_from_traceback(candidate, fixed_kwargs): # noqa: ARG001 out = OptimizeResult( params=None, - criterion=None, + fun=None, **fixed_kwargs, ) return out diff --git a/src/optimagic/optimizers/nlopt_optimizers.py b/src/optimagic/optimizers/nlopt_optimizers.py index 55056bec9..2896d31a0 100644 --- a/src/optimagic/optimizers/nlopt_optimizers.py +++ b/src/optimagic/optimizers/nlopt_optimizers.py @@ -843,8 +843,8 @@ def _process_nlopt_results(nlopt_obj, solution_x): "solution_criterion": nlopt_obj.last_optimum_value(), "solution_derivative": None, "solution_hessian": None, - "n_criterion_evaluations": nlopt_obj.get_numevals(), - "n_derivative_evaluations": None, + "n_fun_evals": nlopt_obj.get_numevals(), + "n_jac_evals": None, "n_iterations": None, "success": nlopt_obj.last_optimize_result() in [1, 2, 3, 4], "message": messages[nlopt_obj.last_optimize_result()], diff --git a/src/optimagic/optimizers/pygmo_optimizers.py 
b/src/optimagic/optimizers/pygmo_optimizers.py index 7a907d327..96287e789 100644 --- a/src/optimagic/optimizers/pygmo_optimizers.py +++ b/src/optimagic/optimizers/pygmo_optimizers.py @@ -1326,8 +1326,8 @@ def _process_pygmo_results(evolved): "solution_criterion": evolved.champion_f[0], "solution_derivative": None, "solution_hessian": None, - "n_criterion_evaluations": evolved.problem.get_fevals(), - "n_derivative_evaluations": evolved.problem.get_gevals(), + "n_fun_evals": evolved.problem.get_fevals(), + "n_jac_evals": evolved.problem.get_gevals(), "n_iterations": None, "success": True, "reached_convergence_criterion": "Number of generations reached.", diff --git a/src/optimagic/optimizers/scipy_optimizers.py b/src/optimagic/optimizers/scipy_optimizers.py index 602367188..7b459c5f3 100644 --- a/src/optimagic/optimizers/scipy_optimizers.py +++ b/src/optimagic/optimizers/scipy_optimizers.py @@ -451,8 +451,8 @@ def process_scipy_result(scipy_results_obj): "solution_criterion": raw_res.get("fun"), "solution_derivative": raw_res.get("jac"), "solution_hessian": raw_res.get("hess"), - "n_criterion_evaluations": raw_res.get("nfev"), - "n_derivative_evaluations": raw_res.get("njac") or raw_res.get("njev"), + "n_fun_evals": raw_res.get("nfev"), + "n_jac_evals": raw_res.get("njac") or raw_res.get("njev"), "n_iterations": raw_res.get("nit"), "success": raw_res.get("success"), "reached_convergence_criterion": None, diff --git a/src/optimagic/optimizers/tao_optimizers.py b/src/optimagic/optimizers/tao_optimizers.py index 64c221e81..012d1a934 100644 --- a/src/optimagic/optimizers/tao_optimizers.py +++ b/src/optimagic/optimizers/tao_optimizers.py @@ -232,8 +232,8 @@ def _process_pounders_results(residuals_out, tao): "solution_criterion": tao.function, "solution_derivative": None, "solution_hessian": None, - "n_criterion_evaluations": tao.getIterationNumber(), - "n_derivative_evaluations": None, + "n_fun_evals": tao.getIterationNumber(), + "n_jac_evals": None, "n_iterations": None, 
"success": bool(convergence_code >= 0), "reached_convergence_criterion": ( diff --git a/tests/optimagic/optimization/test_history_collection.py b/tests/optimagic/optimization/test_history_collection.py index 51381b12a..e3d2409a6 100644 --- a/tests/optimagic/optimization/test_history_collection.py +++ b/tests/optimagic/optimization/test_history_collection.py @@ -68,7 +68,7 @@ def _dummy_optimizer(criterion, x, n_cores, batch_size, batch_evaluator): out = { "solution_x": xs[-1], "solution_criterion": 5, - "n_criterion_evaluations": 15, + "n_fun_evals": 15, "n_iterations": 3, "success": True, } diff --git a/tests/optimagic/optimization/test_multistart.py b/tests/optimagic/optimization/test_multistart.py index 6806af2e5..fbcd5c92d 100644 --- a/tests/optimagic/optimization/test_multistart.py +++ b/tests/optimagic/optimization/test_multistart.py @@ -56,7 +56,7 @@ def test_multistart_minimize_with_sum_of_squares_at_defaults( assert all(isinstance(entry, float) for entry in ms_info["exploration_results"]) assert all(isinstance(entry, OptimizeResult) for entry in ms_info["local_optima"]) assert all(isinstance(entry, pd.DataFrame) for entry in ms_info["start_parameters"]) - assert np.allclose(res.criterion, 0) + assert np.allclose(res.fun, 0) aaae(res.params["value"], np.zeros(4)) diff --git a/tests/optimagic/optimization/test_optimize.py b/tests/optimagic/optimization/test_optimize.py index e5bc74d5f..2f9b86d84 100644 --- a/tests/optimagic/optimization/test_optimize.py +++ b/tests/optimagic/optimization/test_optimize.py @@ -17,7 +17,7 @@ def test_sign_is_switched_back_after_maximization(): algorithm="scipy_lbfgsb", ) - assert np.allclose(res.criterion, 1) + assert np.allclose(res.fun, 1) def test_scipy_lbfgsb_actually_calls_criterion_and_derivative(): diff --git a/tests/optimagic/optimization/test_optimize_result.py b/tests/optimagic/optimization/test_optimize_result.py index a32470c92..b121fcf59 100644 --- a/tests/optimagic/optimization/test_optimize_result.py +++ 
b/tests/optimagic/optimization/test_optimize_result.py @@ -31,14 +31,14 @@ def convergence_report(): def base_inputs(): out = { "params": np.ones(3), - "criterion": 500, - "start_criterion": 1000, + "fun": 500, + "start_fun": 1000, "start_params": np.full(3, 10), "direction": "minimize", "message": "OPTIMIZATION TERMINATED SUCCESSFULLY", "success": True, - "n_criterion_evaluations": 100, - "n_derivative_evaluations": 0, + "n_fun_evals": 100, + "n_jac_evals": 0, "n_iterations": 80, "history": {"criterion": list(range(10))}, "algorithm": "scipy_lbfgsb", diff --git a/tests/test_deprecations.py b/tests/test_deprecations.py index 321753152..a492b9f5a 100644 --- a/tests/test_deprecations.py +++ b/tests/test_deprecations.py @@ -143,8 +143,8 @@ def test_estimagic_optimize_result_is_deprecated(): with pytest.warns(FutureWarning, match=msg): OptimizeResult( params=res.params, - criterion=res.criterion, - start_criterion=res.start_criterion, + fun=res.fun, + start_fun=res.start_fun, start_params=res.start_params, algorithm=res.algorithm, direction=res.direction, @@ -370,3 +370,21 @@ def test_old_convergence_criteria_are_deprecated(algo_option): algorithm="scipy_lbfgsb", algo_options=algo_option, ) + + +def test_deprecated_attributes_of_optimize_result(): + res = om.minimize(lambda x: x @ x, np.arange(3), algorithm="scipy_lbfgsb") + + msg = "attribute is deprecated" + + with pytest.warns(FutureWarning, match=msg): + _ = res.n_criterion_evaluations + + with pytest.warns(FutureWarning, match=msg): + _ = res.n_derivative_evaluations + + with pytest.warns(FutureWarning, match=msg): + _ = res.criterion + + with pytest.warns(FutureWarning, match=msg): + _ = res.start_criterion From 282ec4229908a40fc3902757b573ba9d91bec1b5 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 11:51:19 +0200 Subject: [PATCH 20/25] Use | instead of unions in type hints. 
--- src/estimagic/estimate_ml.py | 14 ++-- src/optimagic/optimization/optimize_result.py | 72 +++++++++++-------- src/optimagic/optimizers/_pounders/bntr.py | 12 ++-- src/optimagic/optimizers/_pounders/gqtpar.py | 12 ++-- .../optimizers/_pounders/linear_subsolvers.py | 6 +- .../_pounders/pounders_auxiliary.py | 14 ++-- src/optimagic/typing.py | 4 ++ 7 files changed, 76 insertions(+), 58 deletions(-) create mode 100644 src/optimagic/typing.py diff --git a/src/estimagic/estimate_ml.py b/src/estimagic/estimate_ml.py index a6b326ac9..81fde607f 100644 --- a/src/estimagic/estimate_ml.py +++ b/src/estimagic/estimate_ml.py @@ -1,7 +1,7 @@ import warnings from dataclasses import dataclass, field from functools import cached_property -from typing import Any, Dict, Union +from typing import Any, Dict import numpy as np import pandas as pd @@ -359,14 +359,14 @@ class LikelihoodResult: _free_estimates: FreeParams _converter: Converter _has_constraints: bool - _optimize_result: Union[OptimizeResult, None] = None + _optimize_result: OptimizeResult | None = None _jacobian: Any = None - _no_jacobian_reason: Union[str, None] = None + _no_jacobian_reason: str | None = None _hessian: Any = None - _no_hessian_reason: Union[str, None] = None - _internal_jacobian: Union[np.ndarray, None] = None - _internal_hessian: Union[np.ndarray, None] = None - _design_info: Union[pd.DataFrame, None] = None + _no_hessian_reason: str | None = None + _internal_jacobian: np.ndarray | None = None + _internal_hessian: np.ndarray | None = None + _design_info: pd.DataFrame | None = None _cache: Dict = field(default_factory=dict) def __post_init__(self): diff --git a/src/optimagic/optimization/optimize_result.py b/src/optimagic/optimization/optimize_result.py index 334728246..7bba3ee3e 100644 --- a/src/optimagic/optimization/optimize_result.py +++ b/src/optimagic/optimization/optimize_result.py @@ -1,5 +1,5 @@ from dataclasses import dataclass, field -from typing import Any, Dict, Union +from typing import 
Any, Dict import numpy as np import pandas as pd @@ -7,6 +7,7 @@ from optimagic.utilities import to_pickle from optimagic.shared.compat import pd_df_map import warnings +from optimagic.typing import PyTree @dataclass @@ -16,25 +17,22 @@ class OptimizeResult: **Attributes** Attributes: - params (Any): The optimal parameters. - fun (float): The optimal criterion value. - start_fun (float): The criterion value at the start parameters. - start_params (Any): The start parameters. - algorithm (str): The algorithm used for the optimization. - direction (str): Maximize or minimize. - n_free (int): Number of free parameters. - message (Union[str, None] = None): Message returned by the underlying algorithm. - success (Union[bool, None] = None): Whether the optimization was successful. - n_criterion_evaluations (Union[int, None] = None): Number of criterion - evaluations. - n_derivative_evaluations (Union[int, None] = None): Number of - derivative evaluations. - n_iterations (Union[int, None] = None): Number of iterations until termination. - history (Union[Dict, None] = None): Optimization history. - convergence_report (Union[Dict, None] = None): The convergence report. - multistart_info (Union[Dict, None] = None): Multistart information. - algorithm_output (Dict = field(default_factory=dict)): Additional algorithm - specific information. + params: The optimal parameters. + fun: The optimal criterion value. + start_fun: The criterion value at the start parameters. + start_params: The start parameters. + algorithm: The algorithm used for the optimization. + direction: Maximize or minimize. + n_free: Number of free parameters. + message: Message returned by the underlying algorithm. + success: Whether the optimization was successful. + n_fun_evals: Number of criterion evaluations. + n_jac_evals: Number of derivative evaluations. + n_iterations: Number of iterations until termination. + history: Optimization history. + convergence_report: The convergence report. 
+ multistart_info: Multistart information. + algorithm_output: Additional algorithm specific information. """ @@ -46,19 +44,25 @@ class OptimizeResult: direction: str n_free: int - message: Union[str, None] = None - success: Union[bool, None] = None - n_fun_evals: Union[int, None] = None - n_jac_evals: Union[int, None] = None - n_iterations: Union[int, None] = None + message: str | None = None + success: bool | None = None + n_fun_evals: int | None = None + n_jac_evals: int | None = None + n_iterations: int | None = None + status: int | None = None + jac: PyTree | None = None - history: Union[Dict, None] = None + history: Dict | None = None - convergence_report: Union[Dict, None] = None + convergence_report: Dict | None = None - multistart_info: Union[Dict, None] = None + multistart_info: Dict | None = None algorithm_output: Dict = field(default_factory=dict) + # ================================================================================== + # Deprecations + # ================================================================================== + @property def criterion(self): msg = "The criterion attribute is deprecated. Use the fun attribute instead." 
@@ -92,6 +96,18 @@ def n_derivative_evaluations(self): warnings.warn(msg, FutureWarning) return self.n_jac_evals + # ================================================================================== + # Scipy aliases + # ================================================================================== + + @property + def x(self): + return self.params + + @property + def x0(self): + return self.start_params + def __repr__(self): first_line = ( f"{self.direction.title()} with {self.n_free} free parameters terminated" diff --git a/src/optimagic/optimizers/_pounders/bntr.py b/src/optimagic/optimizers/_pounders/bntr.py index cfe1f6d6f..14d428dc6 100644 --- a/src/optimagic/optimizers/_pounders/bntr.py +++ b/src/optimagic/optimizers/_pounders/bntr.py @@ -1,7 +1,7 @@ """Auxiliary functions for the quadratic BNTR trust-region subsolver.""" from functools import reduce -from typing import NamedTuple, Union +from typing import NamedTuple import numpy as np from optimagic.optimizers._pounders._conjugate_gradient import ( @@ -16,11 +16,11 @@ class ActiveBounds(NamedTuple): - lower: Union[np.ndarray, None] = None - upper: Union[np.ndarray, None] = None - fixed: Union[np.ndarray, None] = None - active: Union[np.ndarray, None] = None - inactive: Union[np.ndarray, None] = None + lower: np.ndarray | None = None + upper: np.ndarray | None = None + fixed: np.ndarray | None = None + active: np.ndarray | None = None + inactive: np.ndarray | None = None def bntr( diff --git a/src/optimagic/optimizers/_pounders/gqtpar.py b/src/optimagic/optimizers/_pounders/gqtpar.py index d658ba402..a31e59b6a 100644 --- a/src/optimagic/optimizers/_pounders/gqtpar.py +++ b/src/optimagic/optimizers/_pounders/gqtpar.py @@ -1,6 +1,6 @@ """Auxiliary functions for the quadratic GQTPAR trust-region subsolver.""" -from typing import NamedTuple, Union +from typing import NamedTuple import numpy as np from scipy.linalg import cho_solve, solve_triangular @@ -9,15 +9,15 @@ class HessianInfo(NamedTuple): - 
hessian_plus_lambda: Union[np.ndarray, None] = None # shape (n_params, n_params) - upper_triangular: Union[np.ndarray, None] = None # shape (n_params, n_params) + hessian_plus_lambda: np.ndarray | None = None # shape (n_params, n_params) + upper_triangular: np.ndarray | None = None # shape (n_params, n_params) already_factorized: bool = False class DampingFactors(NamedTuple): - candidate: Union[float, None] = None - lower_bound: Union[float, None] = None - upper_bound: Union[float, None] = None + candidate: float | None = None + lower_bound: float | None = None + upper_bound: float | None = None def gqtpar(model, x_candidate, *, k_easy=0.1, k_hard=0.2, maxiter=200): diff --git a/src/optimagic/optimizers/_pounders/linear_subsolvers.py b/src/optimagic/optimizers/_pounders/linear_subsolvers.py index be33fb4a5..dba336b1b 100644 --- a/src/optimagic/optimizers/_pounders/linear_subsolvers.py +++ b/src/optimagic/optimizers/_pounders/linear_subsolvers.py @@ -1,13 +1,13 @@ """Collection of linear trust-region subsolvers.""" -from typing import NamedTuple, Union +from typing import NamedTuple import numpy as np class LinearModel(NamedTuple): - intercept: Union[float, None] = None - linear_terms: Union[np.ndarray, None] = None # shape (n_params, n_params) + intercept: float | None = None + linear_terms: np.ndarray | None = None # shape (n_params, n_params) def minimize_trsbox_linear( diff --git a/src/optimagic/optimizers/_pounders/pounders_auxiliary.py b/src/optimagic/optimizers/_pounders/pounders_auxiliary.py index d598d3c25..643c7dbc6 100644 --- a/src/optimagic/optimizers/_pounders/pounders_auxiliary.py +++ b/src/optimagic/optimizers/_pounders/pounders_auxiliary.py @@ -1,6 +1,6 @@ """Auxiliary functions for the pounders algorithm.""" -from typing import NamedTuple, Union +from typing import NamedTuple import numpy as np from scipy.linalg import qr_multiply @@ -14,16 +14,14 @@ class ResidualModel(NamedTuple): - intercepts: Union[np.ndarray, None] = None # shape (n_residuals,) 
- linear_terms: Union[np.ndarray, None] = None # shape (n_residuals, n_params) - square_terms: Union[np.ndarray, None] = ( - None # shape (n_residuals, n_params, n_params) - ) + intercepts: np.ndarray | None = None # shape (n_residuals,) + linear_terms: np.ndarray | None = None # shape (n_residuals, n_params) + square_terms: np.ndarray | None = None # shape (n_residuals, n_params, n_params) class MainModel(NamedTuple): - linear_terms: Union[np.ndarray, None] = None # shape (n_params,) - square_terms: Union[np.ndarray, None] = None # shape (n_params, n_params) + linear_terms: np.ndarray | None = None # shape (n_params,) + square_terms: np.ndarray | None = None # shape (n_params, n_params) def create_initial_residual_model(history, accepted_index, delta): diff --git a/src/optimagic/typing.py b/src/optimagic/typing.py new file mode 100644 index 000000000..f3fb9a5c1 --- /dev/null +++ b/src/optimagic/typing.py @@ -0,0 +1,4 @@ +from typing import Any + + +PyTree = Any From b5cff07facd2de4c5f31599ab0fd723ab21a395c Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 11:59:35 +0200 Subject: [PATCH 21/25] Add aliases. 
--- src/optimagic/optimization/optimize_result.py | 34 +++++++++++++++---- 1 file changed, 27 insertions(+), 7 deletions(-) diff --git a/src/optimagic/optimization/optimize_result.py b/src/optimagic/optimization/optimize_result.py index 7bba3ee3e..b2a07fced 100644 --- a/src/optimagic/optimization/optimize_result.py +++ b/src/optimagic/optimization/optimize_result.py @@ -48,9 +48,13 @@ class OptimizeResult: success: bool | None = None n_fun_evals: int | None = None n_jac_evals: int | None = None + n_hess_evals: int | None = None n_iterations: int | None = None status: int | None = None jac: PyTree | None = None + hess: PyTree | None = None + hess_inv: PyTree | None = None + max_constaint_violation: float | None = None history: Dict | None = None @@ -64,13 +68,13 @@ class OptimizeResult: # ================================================================================== @property - def criterion(self): + def criterion(self) -> float: msg = "The criterion attribute is deprecated. Use the fun attribute instead." warnings.warn(msg, FutureWarning) return self.fun @property - def start_criterion(self): + def start_criterion(self) -> float: msg = ( "The start_criterion attribute is deprecated. Use the start_fun attribute " "instead." @@ -79,7 +83,7 @@ def start_criterion(self): return self.start_fun @property - def n_criterion_evaluations(self): + def n_criterion_evaluations(self) -> int | None: msg = ( "The n_criterion_evaluations attribute is deprecated. Use the n_fun_evals " "attribute instead." @@ -88,7 +92,7 @@ def n_criterion_evaluations(self): return self.n_fun_evals @property - def n_derivative_evaluations(self): + def n_derivative_evaluations(self) -> int | None: msg = ( "The n_derivative_evaluations attribute is deprecated. Use the n_jac_evals " "attribute instead." 
@@ -101,14 +105,30 @@ def n_derivative_evaluations(self): # ================================================================================== @property - def x(self): + def x(self) -> PyTree: return self.params @property - def x0(self): + def x0(self) -> PyTree: return self.start_params - def __repr__(self): + @property + def nfev(self) -> int | None: + return self.n_fun_evals + + @property + def nit(self) -> int | None: + return self.n_iterations + + @property + def njev(self) -> int | None: + return self.n_jac_evals + + @property + def nhev(self) -> int | None: + return self.n_hess_evals + + def __repr__(self) -> str: first_line = ( f"{self.direction.title()} with {self.n_free} free parameters terminated" ) From e19eb4e616eb3ad2151e310c96fe63a1cb0477aa Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 12:00:57 +0200 Subject: [PATCH 22/25] Fix. --- src/optimagic/optimizers/nag_optimizers.py | 2 +- src/optimagic/optimizers/scipy_optimizers.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/src/optimagic/optimizers/nag_optimizers.py b/src/optimagic/optimizers/nag_optimizers.py index 9c1dab381..e6728899d 100644 --- a/src/optimagic/optimizers/nag_optimizers.py +++ b/src/optimagic/optimizers/nag_optimizers.py @@ -662,7 +662,7 @@ def _process_nag_result(nag_result_obj, len_x): """ processed = { "solution_criterion": nag_result_obj.f, - "n_criterion_evaluations": nag_result_obj.nx, + "n_fun_evals": nag_result_obj.nx, "message": nag_result_obj.msg, "success": nag_result_obj.flag == nag_result_obj.EXIT_SUCCESS, "reached_convergence_criterion": None, diff --git a/src/optimagic/optimizers/scipy_optimizers.py b/src/optimagic/optimizers/scipy_optimizers.py index 7b459c5f3..86ab4f1ab 100644 --- a/src/optimagic/optimizers/scipy_optimizers.py +++ b/src/optimagic/optimizers/scipy_optimizers.py @@ -669,7 +669,7 @@ def scipy_brute( out = { "solution_x": res[0], "solution_criterion": res[1], - "n_criterion_evaluations": res[2].size, + 
"n_fun_evals": res[2].size, "n_iterations": res[2].size, "success": True, "message": "brute force optimization terminated successfully", From e18714295ff580a781b6ca573b7e252f40bfbc51 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 12:05:19 +0200 Subject: [PATCH 23/25] Add dict access. --- src/optimagic/optimization/optimize_result.py | 3 +++ tests/optimagic/optimization/test_optimize_result.py | 6 ++++++ 2 files changed, 9 insertions(+) diff --git a/src/optimagic/optimization/optimize_result.py b/src/optimagic/optimization/optimize_result.py index b2a07fced..5eff28347 100644 --- a/src/optimagic/optimization/optimize_result.py +++ b/src/optimagic/optimization/optimize_result.py @@ -128,6 +128,9 @@ def njev(self) -> int | None: def nhev(self) -> int | None: return self.n_hess_evals + def __getitem__(self, key): + return getattr(self, key) + def __repr__(self) -> str: first_line = ( f"{self.direction.title()} with {self.n_free} free parameters terminated" diff --git a/tests/optimagic/optimization/test_optimize_result.py b/tests/optimagic/optimization/test_optimize_result.py index b121fcf59..24100bf6b 100644 --- a/tests/optimagic/optimization/test_optimize_result.py +++ b/tests/optimagic/optimization/test_optimize_result.py @@ -68,3 +68,9 @@ def test_to_pickle(base_inputs, convergence_report, tmp_path): **base_inputs, ) res.to_pickle(tmp_path / "bla.pkl") + + +def test_dict_access(base_inputs): + res = OptimizeResult(**base_inputs) + assert res["fun"] == 500 + assert res["nfev"] == 100 From d697cae1d366ae2146858f17fde6d582a610ac98 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 12:59:24 +0200 Subject: [PATCH 24/25] Adjust documentation. 
--- .../tutorials/bootstrap_overview.ipynb | 34 +- .../tutorials/likelihood_overview.ipynb | 346 +++++++++++++++++- .../why_optimization_is_hard.ipynb | 154 +------- .../how_to/how_to_algorithm_selection.ipynb | 26 +- .../how_to/how_to_batch_evaluators.ipynb | 42 --- docs/source/how_to/how_to_benchmarking.ipynb | 6 +- docs/source/how_to/how_to_bounds.ipynb | 73 ++-- docs/source/how_to/how_to_constraints.md | 34 +- .../how_to_errors_during_optimization.ipynb | 2 +- docs/source/how_to/how_to_logging.ipynb | 6 +- docs/source/how_to/how_to_multistart.ipynb | 24 +- docs/source/how_to/how_to_scaling.md | 6 +- docs/source/how_to/how_to_start_parameters.md | 8 +- docs/source/how_to/index.md | 1 - .../tutorials/optimization_overview.ipynb | 56 +-- 15 files changed, 479 insertions(+), 339 deletions(-) delete mode 100644 docs/source/how_to/how_to_batch_evaluators.ipynb diff --git a/docs/source/estimagic/tutorials/bootstrap_overview.ipynb b/docs/source/estimagic/tutorials/bootstrap_overview.ipynb index 5f6dbd467..c27bfa24b 100644 --- a/docs/source/estimagic/tutorials/bootstrap_overview.ipynb +++ b/docs/source/estimagic/tutorials/bootstrap_overview.ipynb @@ -15,7 +15,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ @@ -42,9 +42,9 @@ "name": "stderr", "output_type": "stream", "text": [ - "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_82008/2496026297.py:3: FutureWarning: Downcasting behavior in `replace` is deprecated and will be removed in a future version. To retain the old behavior, explicitly call `result.infer_objects(copy=False)`. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)`\n", + "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_90869/2496026297.py:3: FutureWarning: Downcasting behavior in `replace` is deprecated and will be removed in a future version. To retain the old behavior, explicitly call `result.infer_objects(copy=False)`. 
To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)`\n", " df = df.replace({\"time\": replacements})\n", - "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_82008/2496026297.py:3: FutureWarning: The behavior of Series.replace (and DataFrame.replace) with CategoricalDtype is deprecated. In a future version, replace will only be used for cases that preserve the categories. To change the categories, use ser.cat.rename_categories instead.\n", + "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_90869/2496026297.py:3: FutureWarning: The behavior of Series.replace (and DataFrame.replace) with CategoricalDtype is deprecated. In a future version, replace will only be used for cases that preserve the categories. To change the categories, use ser.cat.rename_categories instead.\n", " df = df.replace({\"time\": replacements})\n" ] }, @@ -202,11 +202,11 @@ { "data": { "text/plain": [ - "(constant 90.857208\n", - " time 0.141391\n", + "(constant 90.810164\n", + " time 0.147692\n", " dtype: float64,\n", - " constant 96.738019\n", - " time 0.633684\n", + " constant 96.676859\n", + " time 0.632926\n", " dtype: float64)" ] }, @@ -228,8 +228,8 @@ { "data": { "text/plain": [ - "constant 1.496127\n", - "time 0.127750\n", + "constant 1.494204\n", + "time 0.123496\n", "dtype: float64" ] }, @@ -259,11 +259,11 @@ { "data": { "text/plain": [ - "(constant 91.345295\n", - " time 0.199327\n", + "(constant 91.416070\n", + " time 0.194815\n", " dtype: float64,\n", - " constant 96.264179\n", - " time 0.612123\n", + " constant 96.377676\n", + " time 0.606278\n", " dtype: float64)" ] }, @@ -304,8 +304,8 @@ { "data": { "text/plain": [ - "constant 1.207991\n", - "time 0.100024\n", + "constant 1.156068\n", + "time 0.100937\n", "dtype: float64" ] }, @@ -633,7 +633,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": 17, "metadata": {}, "outputs": [ { @@ -787,7 +787,7 @@ "[90 rows x 6 columns]" ] }, - "execution_count": 
19, + "execution_count": 17, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/source/estimagic/tutorials/likelihood_overview.ipynb b/docs/source/estimagic/tutorials/likelihood_overview.ipynb index 8b46b836c..fc94478f8 100644 --- a/docs/source/estimagic/tutorials/likelihood_overview.ipynb +++ b/docs/source/estimagic/tutorials/likelihood_overview.ipynb @@ -30,7 +30,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ @@ -51,7 +51,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 2, "metadata": {}, "outputs": [], "source": [ @@ -64,9 +64,66 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 3, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
valuelower_bound
intercept2-inf
slope-1-inf
sd11.000000e-10
\n", + "
" + ], + "text/plain": [ + " value lower_bound\n", + "intercept 2 -inf\n", + "slope -1 -inf\n", + "sd 1 1.000000e-10" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "true_params = pd.DataFrame(\n", " data=[[2, -np.inf], [-1, -np.inf], [1, 1e-10]],\n", @@ -78,7 +135,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 4, "metadata": {}, "outputs": [], "source": [ @@ -94,7 +151,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -127,7 +184,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ @@ -143,9 +200,86 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
valuestandard_errorci_lowerci_upperp_valuefreestars
intercept1.9450.1041.7422.1480.0True***
slope-0.9450.113-1.167-0.7230.0True***
sd0.9540.0790.7991.1090.0True***
\n", + "
" + ], + "text/plain": [ + " value standard_error ci_lower ci_upper p_value free stars\n", + "intercept 1.945 0.104 1.742 2.148 0.0 True ***\n", + "slope -0.945 0.113 -1.167 -0.723 0.0 True ***\n", + "sd 0.954 0.079 0.799 1.109 0.0 True ***" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "res.summary().round(3)" ] @@ -163,33 +297,213 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
valuelower_bound
intercept1.944964-inf
slope-0.944918-inf
sd0.9542301.000000e-10
\n", + "
" + ], + "text/plain": [ + " value lower_bound\n", + "intercept 1.944964 -inf\n", + "slope -0.944918 -inf\n", + "sd 0.954230 1.000000e-10" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "res.params" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
interceptslopesd
intercept0.0089860.000426-0.001904
slope0.0004260.0077340.000303
sd-0.0019040.0003030.003748
\n", + "
" + ], + "text/plain": [ + " intercept slope sd\n", + "intercept 0.008986 0.000426 -0.001904\n", + "slope 0.000426 0.007734 0.000303\n", + "sd -0.001904 0.000303 0.003748" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "res.cov(method=\"robust\")" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 10, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
valuelower_bound
intercept0.103760-inf
slope0.113342-inf
sd0.0789601.000000e-10
\n", + "
" + ], + "text/plain": [ + " value lower_bound\n", + "intercept 0.103760 -inf\n", + "slope 0.113342 -inf\n", + "sd 0.078960 1.000000e-10" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "res.se()" ] } ], "metadata": { + "kernelspec": { + "display_name": "optimagic", + "language": "python", + "name": "python3" + }, "language_info": { "codemirror_mode": { "name": "ipython", @@ -200,7 +514,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.13" + "version": "3.10.14" } }, "nbformat": 4, diff --git a/docs/source/explanation/why_optimization_is_hard.ipynb b/docs/source/explanation/why_optimization_is_hard.ipynb index c9b99aaaa..bd59bd76a 100644 --- a/docs/source/explanation/why_optimization_is_hard.ipynb +++ b/docs/source/explanation/why_optimization_is_hard.ipynb @@ -29,7 +29,6 @@ "source": [ "import optimagic as om\n", "import numpy as np\n", - "import pandas as pd\n", "import seaborn as sns" ] }, @@ -39,12 +38,12 @@ "metadata": {}, "outputs": [], "source": [ - "def sphere(params):\n", - " return (params[\"value\"] ** 2).sum()\n", + "def sphere(x):\n", + " return x @ x\n", "\n", "\n", - "def sphere_gradient(params):\n", - " return params * 2" + "def sphere_gradient(x):\n", + " return 2 * x" ] }, { @@ -151,85 +150,17 @@ "metadata": {}, "outputs": [], "source": [ - "def sphere_with_noise(params, rng):\n", - " return sphere(params) + rng.normal(scale=0.02)" + "def sphere_with_noise(x, rng):\n", + " return sphere(x) + rng.normal(scale=0.02)" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
value
x_01
x_12
x_23
x_34
x_45
\n", - "
" - ], - "text/plain": [ - " value\n", - "x_0 1\n", - "x_1 2\n", - "x_2 3\n", - "x_3 4\n", - "x_4 5" - ] - }, - "execution_count": 7, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ - "start_params = pd.DataFrame(\n", - " data=np.arange(5) + 1,\n", - " columns=[\"value\"],\n", - " index=[f\"x_{i}\" for i in range(5)],\n", - ")\n", - "start_params" + "start_params = np.arange(5)" ] }, { @@ -274,11 +205,11 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere_with_noise,\n", + " fun=sphere_with_noise,\n", " params=start_params,\n", " algorithm=\"scipy_lbfgsb\",\n", " logging=False,\n", - " criterion_kwargs={\"rng\": rng},\n", + " fun_kwargs={\"rng\": rng},\n", ")\n", "\n", "res.success" @@ -291,60 +222,8 @@ "outputs": [ { "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
value
x_01.0
x_12.0
x_23.0
x_34.0
x_45.0
\n", - "
" - ], "text/plain": [ - " value\n", - "x_0 1.0\n", - "x_1 2.0\n", - "x_2 3.0\n", - "x_3 4.0\n", - "x_4 5.0" + "array([0., 1., 2., 3., 4.])" ] }, "execution_count": 10, @@ -389,10 +268,8 @@ "metadata": {}, "outputs": [], "source": [ - "def piecewise_constant_sphere(params):\n", - " params = params.copy(deep=True)\n", - " params[\"value\"] = params[\"value\"].round(2)\n", - " return sphere(params)" + "def piecewise_constant_sphere(x):\n", + " return sphere(x.round(2))" ] }, { @@ -425,7 +302,7 @@ "text/plain": [ "Minimize with 5 free parameters terminated successfully after 1 criterion evaluations, 1 derivative evaluations and 0 iterations.\n", "\n", - "The value of criterion improved from 55.0 to 55.0.\n", + "The value of criterion improved from 30 to 30.0.\n", "\n", "The scipy_lbfgsb algorithm reported: CONVERGENCE: NORM_OF_PROJECTED_GRADIENT_<=_PGTOL" ] @@ -437,10 +314,9 @@ ], "source": [ "res = om.minimize(\n", - " criterion=piecewise_constant_sphere,\n", + " fun=piecewise_constant_sphere,\n", " params=start_params,\n", " algorithm=\"scipy_lbfgsb\",\n", - " logging=False,\n", ")\n", "\n", "res" diff --git a/docs/source/how_to/how_to_algorithm_selection.ipynb b/docs/source/how_to/how_to_algorithm_selection.ipynb index 95a2b769c..e7a898172 100644 --- a/docs/source/how_to/how_to_algorithm_selection.ipynb +++ b/docs/source/how_to/how_to_algorithm_selection.ipynb @@ -67,7 +67,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "metadata": {}, "outputs": [ { @@ -76,19 +76,19 @@ "3" ] }, - "execution_count": 3, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=start_params,\n", " algorithm=\"scipy_lbfgsb\",\n", - " derivative=sphere_gradient,\n", + " jac=sphere_gradient,\n", ")\n", - "res.n_criterion_evaluations" + "res.n_fun_evals" ] }, { @@ -120,7 +120,7 @@ }, { "cell_type": "code", - "execution_count": 4, + 
"execution_count": 5, "metadata": {}, "outputs": [ { @@ -129,18 +129,18 @@ "33" ] }, - "execution_count": 4, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=start_params,\n", " algorithm=\"nag_pybobyqa\",\n", ")\n", - "res.n_criterion_evaluations" + "res.n_fun_evals" ] }, { @@ -159,7 +159,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 6, "metadata": {}, "outputs": [ { @@ -168,18 +168,18 @@ "9" ] }, - "execution_count": 5, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=start_params,\n", " algorithm=\"nag_dfols\",\n", ")\n", - "res.n_criterion_evaluations" + "res.n_fun_evals" ] } ], diff --git a/docs/source/how_to/how_to_batch_evaluators.ipynb b/docs/source/how_to/how_to_batch_evaluators.ipynb deleted file mode 100644 index 58dff24c6..000000000 --- a/docs/source/how_to/how_to_batch_evaluators.ipynb +++ /dev/null @@ -1,42 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# How to use batch evaluators" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "(to be written.)\n", - "\n", - "In case of an urgent request for this guide, feel free to open an issue \n", - "[here](https://github.com/OpenSourceEconomics/optimagic/issues)." 
- ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.10.8" - } - }, - "nbformat": 4, - "nbformat_minor": 2 -} diff --git a/docs/source/how_to/how_to_benchmarking.ipynb b/docs/source/how_to/how_to_benchmarking.ipynb index c2d979fc5..6a433476e 100644 --- a/docs/source/how_to/how_to_benchmarking.ipynb +++ b/docs/source/how_to/how_to_benchmarking.ipynb @@ -619,7 +619,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 13, "id": "96614437", "metadata": {}, "outputs": [], @@ -629,7 +629,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 14, "id": "f9d63ee9", "metadata": {}, "outputs": [ @@ -676,7 +676,7 @@ "Index: []" ] }, - "execution_count": 15, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/source/how_to/how_to_bounds.ipynb b/docs/source/how_to/how_to_bounds.ipynb index bf1d2cb36..a1939dd7f 100644 --- a/docs/source/how_to/how_to_bounds.ipynb +++ b/docs/source/how_to/how_to_bounds.ipynb @@ -24,7 +24,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 2, "id": "ec477eb7", "metadata": {}, "outputs": [], @@ -35,18 +35,18 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 3, "id": "b0eb906d", "metadata": {}, "outputs": [], "source": [ - "def criterion(x):\n", + "def fun(x):\n", " return x @ x" ] }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "id": "6b43b46e", "metadata": {}, "outputs": [ @@ -56,13 +56,13 @@ "array([ 0.00000000e+00, -1.33177530e-08, 7.18836679e-09])" ] }, - "execution_count": 3, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ 
- "res = om.minimize(criterion, params=np.arange(3), algorithm=\"scipy_lbfgsb\")\n", + "res = om.minimize(fun=fun, params=np.arange(3), algorithm=\"scipy_lbfgsb\")\n", "res.params" ] }, @@ -80,7 +80,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 5, "id": "0c450bdd", "metadata": {}, "outputs": [ @@ -90,14 +90,14 @@ "array([1., 1., 1.])" ] }, - "execution_count": 4, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "res = om.minimize(\n", - " criterion, params=np.arange(3), lower_bounds=np.ones(3), algorithm=\"scipy_lbfgsb\"\n", + " fun=fun, params=np.arange(3), lower_bounds=np.ones(3), algorithm=\"scipy_lbfgsb\"\n", ")\n", "res.params" ] @@ -112,7 +112,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 6, "id": "26c5c0df", "metadata": {}, "outputs": [ @@ -122,14 +122,14 @@ "array([-1.00000000e+00, -3.57647467e-08, 1.00000000e+00])" ] }, - "execution_count": 5, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "res = om.minimize(\n", - " criterion,\n", + " fun=fun,\n", " params=np.arange(3),\n", " algorithm=\"scipy_lbfgsb\",\n", " lower_bounds=np.array([-2, -np.inf, 1]),\n", @@ -150,7 +150,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 7, "id": "9c05eb78", "metadata": {}, "outputs": [], @@ -158,13 +158,13 @@ "params = {\"x\": np.arange(3), \"intercept\": 3}\n", "\n", "\n", - "def criterion(params):\n", + "def fun(params):\n", " return params[\"x\"] @ params[\"x\"] + params[\"intercept\"]" ] }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 8, "id": "ddcc54d4", "metadata": {}, "outputs": [ @@ -175,14 +175,14 @@ " 'intercept': -2.0}" ] }, - "execution_count": 7, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "res = om.minimize(\n", - " criterion,\n", + " fun=fun,\n", " params=params,\n", " algorithm=\"scipy_lbfgsb\",\n", " 
lower_bounds={\"intercept\": -2},\n", @@ -213,7 +213,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 9, "id": "b4a95453", "metadata": {}, "outputs": [ @@ -278,7 +278,7 @@ "intercept 0 3 -2" ] }, - "execution_count": 8, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } @@ -295,41 +295,24 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 24, "id": "34d59f01", "metadata": {}, "outputs": [], "source": [ - "def criterion(params):\n", - " value = (\n", - " params.loc[\"x\"][\"value\"] @ params.loc[\"x\"][\"value\"]\n", - " + params.loc[\"intercept\"][\"value\"]\n", - " )\n", - " return float(value) # necessary since value is a pd.Series" + "def fun(params):\n", + " x = params.loc[\"x\"][\"value\"].to_numpy()\n", + " intercept = params.loc[\"intercept\"][\"value\"].iloc[0]\n", + " value = x @ x + intercept\n", + " return float(value)" ] }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 25, "id": "b284ad8a", "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_45054/313144487.py:6: FutureWarning: Calling float on a single element Series is deprecated and will raise a TypeError in the future. Use float(ser.iloc[0]) instead\n", - " return float(value) # necessary since value is a pd.Series\n", - "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_45054/313144487.py:6: FutureWarning: Calling float on a single element Series is deprecated and will raise a TypeError in the future. Use float(ser.iloc[0]) instead\n", - " return float(value) # necessary since value is a pd.Series\n", - "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_45054/313144487.py:6: FutureWarning: Calling float on a single element Series is deprecated and will raise a TypeError in the future. 
Use float(ser.iloc[0]) instead\n", - " return float(value) # necessary since value is a pd.Series\n", - "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_45054/313144487.py:6: FutureWarning: Calling float on a single element Series is deprecated and will raise a TypeError in the future. Use float(ser.iloc[0]) instead\n", - " return float(value) # necessary since value is a pd.Series\n", - "/var/folders/gf/_b8vq9wn2sv2221129y0c3sh0000gn/T/ipykernel_45054/313144487.py:6: FutureWarning: Calling float on a single element Series is deprecated and will raise a TypeError in the future. Use float(ser.iloc[0]) instead\n", - " return float(value) # necessary since value is a pd.Series\n" - ] - }, { "data": { "text/html": [ @@ -391,14 +374,14 @@ "intercept 0 -2.0 -2" ] }, - "execution_count": 10, + "execution_count": 25, "metadata": {}, "output_type": "execute_result" } ], "source": [ "res = om.minimize(\n", - " criterion,\n", + " fun,\n", " params=params,\n", " algorithm=\"scipy_lbfgsb\",\n", ")\n", diff --git a/docs/source/how_to/how_to_constraints.md b/docs/source/how_to/how_to_constraints.md index 07f1e820d..07c8e14c9 100644 --- a/docs/source/how_to/how_to_constraints.md +++ b/docs/source/how_to/how_to_constraints.md @@ -34,7 +34,7 @@ you can impose and how you specify them in optimagic: >>> import numpy as np >>> import optimagic as om - >>> def criterion(params): + >>> def fun(params): ... offset = np.linspace(1, 0, len(params)) ... x = params - offset ... return x @ x @@ -48,7 +48,7 @@ The unconstrained optimum of a six-dimensional version of this problem is: .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.array([2.5, 1, 1, 1, 1, -2.5]), ... algorithm="scipy_lbfgsb", ... ) @@ -78,7 +78,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.array([2.5, 1, 1, 1, 1, -2.5]), ... 
algorithm="scipy_lbfgsb", ... constraints={"loc": [0, 5], "type": "fixed"}, @@ -105,7 +105,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.array([1, 1, 1, 1, 1, 1]), ... algorithm="scipy_lbfgsb", ... constraints={"loc": [1, 2, 3], "type": "increasing"}, @@ -144,7 +144,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.array([1, 1, 1, 1, 1, 1]), ... algorithm="scipy_lbfgsb", ... constraints={"loc": [3, 0, 4], "type": "decreasing"}, @@ -176,7 +176,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.array([1, 1, 1, 1, 1, 1]), ... algorithm="scipy_lbfgsb", ... constraints={"loc": [0, 5], "type": "equality"}, @@ -201,7 +201,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.array([1, 1, 1, 1, 1, 1]), ... algorithm="scipy_lbfgsb", ... constraints={"locs": [[0, 1], [2, 3]], "type": "pairwise_equality"}, @@ -226,7 +226,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.array([0.3, 0.2, 0.25, 0.25, 1, 1]), ... algorithm="scipy_lbfgsb", ... constraints={"loc": [0, 1, 2, 3], "type": "probability"}, @@ -257,7 +257,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.ones(6), ... algorithm="scipy_lbfgsb", ... 
constraints={"loc": [0, 1, 2], "type": "covariance"}, @@ -295,7 +295,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.ones(6), ... algorithm="scipy_lbfgsb", ... constraints={"loc": [0, 1, 2], "type": "sdcorr"}, @@ -342,7 +342,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.ones(6), ... algorithm="scipy_lbfgsb", ... constraints={ @@ -388,7 +388,7 @@ constraint is imposed via the "loc" key. Generalizations for selecting subsets o .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.ones(6), ... algorithm="scipy_slsqp", ... constraints={ @@ -422,7 +422,7 @@ constraints simultaneously, simple pass in a list of constraints. For example: .. code-block:: python >>> res = om.minimize( - ... criterion=criterion, + ... fun=fun, ... params=np.ones(6), ... algorithm="scipy_lbfgsb", ... constraints=[ @@ -493,7 +493,7 @@ Below we show how to use each of these selection methods in simple examples .. code-block:: python res = om.minimize( - criterion=some_criterion, + fun=some_fun, params=params, algorithm="scipy_lbfgsb", constraints={"loc": "cutoffs", "type": "increasing"}, @@ -536,7 +536,7 @@ Below we show how to use each of these selection methods in simple examples .. code-block:: python res = om.minimize( - criterion=some_criterion, + fun=some_fun, params=params, algorithm="scipy_lbfgsb", constraints={"query": "category == 'betas' | name == 'a'", "type": "fixed"}, @@ -567,7 +567,7 @@ Below we show how to use each of these selection methods in simple examples .. 
code-block:: python res = om.minimize( - criterion=some_criterion, + fun=some_fun, params=params, algorithm="scipy_lbfgsb", constraints={"selector": lambda params: params["b"]["d"], "type": "fixed"}, @@ -587,7 +587,7 @@ Below we show how to use each of these selection methods in simple examples res = om.minimize( - criterion=some_criterion, + fun=some_fun, params=params, algorithm="scipy_lbfgsb", constraints={"selector": my_selector, "type": "fixed"}, diff --git a/docs/source/how_to/how_to_errors_during_optimization.ipynb b/docs/source/how_to/how_to_errors_during_optimization.ipynb index 3d5de4bb3..aa296ad05 100644 --- a/docs/source/how_to/how_to_errors_during_optimization.ipynb +++ b/docs/source/how_to/how_to_errors_during_optimization.ipynb @@ -165,7 +165,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=jennrich_sampson,\n", + " fun=jennrich_sampson,\n", " params=start_x,\n", " algorithm=\"scipy_lbfgsb\",\n", " error_handling=\"continue\",\n", diff --git a/docs/source/how_to/how_to_logging.ipynb b/docs/source/how_to/how_to_logging.ipynb index 86eee78a2..e1c75203d 100644 --- a/docs/source/how_to/how_to_logging.ipynb +++ b/docs/source/how_to/how_to_logging.ipynb @@ -46,7 +46,7 @@ "outputs": [], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " logging=\"my_log.db\",\n", @@ -73,7 +73,7 @@ "outputs": [], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " logging=\"my_log.db\",\n", @@ -97,7 +97,7 @@ "outputs": [], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " logging=\"my_log.db\",\n", diff --git a/docs/source/how_to/how_to_multistart.ipynb b/docs/source/how_to/how_to_multistart.ipynb index 9597fa1bc..409036bcf 100644 --- a/docs/source/how_to/how_to_multistart.ipynb +++ 
b/docs/source/how_to/how_to_multistart.ipynb @@ -152,7 +152,7 @@ " \n", " \n", " 1\n", - " -0.0\n", + " 0.0\n", " -5\n", " 10\n", " \n", @@ -169,7 +169,7 @@ "text/plain": [ " value soft_lower_bound soft_upper_bound\n", "0 -0.0 -5 10\n", - "1 -0.0 -5 10\n", + "1 0.0 -5 10\n", "2 0.0 -5 10" ] }, @@ -180,7 +180,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=params,\n", " algorithm=\"scipy_lbfgsb\",\n", " multistart=True,\n", @@ -291,17 +291,17 @@ "text/plain": [ "Minimize with 3 free parameters terminated successfully after 6 criterion evaluations, 6 derivative evaluations and 4 iterations.\n", "\n", - "The value of criterion improved from 14.0 to 6.38558109434918e-18.\n", + "The value of criterion improved from 14.0 to 9.468366080598408e-18.\n", "\n", "The multistart_scipy_lbfgsb algorithm reported: CONVERGENCE: NORM_OF_PROJECTED_GRADIENT_<=_PGTOL\n", "\n", "Independent of the convergence criteria used by multistart_scipy_lbfgsb, the strength of convergence can be assessed by the following criteria:\n", "\n", " one_step five_steps \n", - "relative_criterion_change 3.06e-14*** 3.06e-14***\n", - "relative_params_change 5.482e-07* 5.482e-07* \n", - "absolute_criterion_change 3.06e-15*** 3.06e-15***\n", - "absolute_params_change 5.482e-08* 5.482e-08* \n", + "relative_criterion_change 4.859e-14*** 4.859e-14***\n", + "relative_params_change 7.279e-07* 7.279e-07* \n", + "absolute_criterion_change 4.859e-15*** 4.859e-15***\n", + "absolute_params_change 7.279e-08* 7.279e-08* \n", "\n", "(***: change <= 1e-10, **: change <= 1e-8, *: change <= 1e-5. Change refers to a change between accepted steps. The first column only considers the last step. 
The second column considers the last five steps.)" ] @@ -313,7 +313,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=params,\n", " algorithm=\"scipy_lbfgsb\",\n", " multistart=True,\n", @@ -364,7 +364,7 @@ " \n", " \n", " 1\n", - " -0.0\n", + " 0.0\n", " -5\n", " 10\n", " \n", @@ -381,7 +381,7 @@ "text/plain": [ " value soft_lower_bound soft_upper_bound\n", "0 -0.0 -5 10\n", - "1 -0.0 -5 10\n", + "1 0.0 -5 10\n", "2 0.0 -5 10" ] }, @@ -541,7 +541,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.8" + "version": "3.10.14" } }, "nbformat": 4, diff --git a/docs/source/how_to/how_to_scaling.md b/docs/source/how_to/how_to_scaling.md index d127cdc5a..22f4efab2 100644 --- a/docs/source/how_to/how_to_scaling.md +++ b/docs/source/how_to/how_to_scaling.md @@ -50,7 +50,7 @@ start_params["lower_bound"] = 0 start_params["upper_bound"] = 2 * np.arange(5) + 1 res = om.minimize( - criterion=sphere, + fun=sphere, params=start_params, algorithm="scipy_lbfgsb", scaling=True, @@ -99,7 +99,7 @@ start_params["lower_bound"] = 0 start_params["upper_bound"] = 2 * np.arange(5) + 1 res = om.minimize( - criterion=sphere, + fun=sphere, params=start_params, algorithm="scipy_lbfgsb", scaling=True, @@ -134,7 +134,7 @@ start_params["lower_bound"] = 0 start_params["upper_bound"] = 2 * np.arange(5) + 1 res = om.minimize( - criterion=sphere, + fun=sphere, params=start_params, algorithm="scipy_lbfgsb", scaling=True, diff --git a/docs/source/how_to/how_to_start_parameters.md b/docs/source/how_to/how_to_start_parameters.md index 55b5daab1..fc5a031e9 100644 --- a/docs/source/how_to/how_to_start_parameters.md +++ b/docs/source/how_to/how_to_start_parameters.md @@ -37,7 +37,7 @@ Again, we use the simple `sphere` function you know from other tutorials as an e om.minimize( - criterion=sphere, + fun=sphere, params=np.arange(3), algorithm="scipy_lbfgsb", ) @@ -66,7 +66,7 @@ Again, we use the simple `sphere` 
function you know from other tutorials as an e ) om.minimize( - criterion=sphere, + fun=sphere, params=params, algorithm="scipy_lbfgsb", ) @@ -103,7 +103,7 @@ Again, we use the simple `sphere` function you know from other tutorials as an e res = om.minimize( - criterion=sphere, + fun=sphere, params={"a": 0, "b": 1, "c": pd.Series([2, 3, 4])}, algorithm="scipy_neldermead", ) @@ -131,7 +131,7 @@ Again, we use the simple `sphere` function you know from other tutorials as an e om.minimize( - criterion=sphere, + fun=sphere, params=3, algorithm="scipy_lbfgsb", ) diff --git a/docs/source/how_to/index.md b/docs/source/how_to/index.md index f16634510..747a50c24 100644 --- a/docs/source/how_to/index.md +++ b/docs/source/how_to/index.md @@ -21,7 +21,6 @@ how_to_scaling how_to_logging how_to_errors_during_optimization how_to_slice_plot -how_to_batch_evaluators how_to_benchmarking how_to_first_derivative how_to_second_derivative diff --git a/docs/source/tutorials/optimization_overview.ipynb b/docs/source/tutorials/optimization_overview.ipynb index 93cb7e5f9..58b53ba3f 100644 --- a/docs/source/tutorials/optimization_overview.ipynb +++ b/docs/source/tutorials/optimization_overview.ipynb @@ -11,7 +11,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ @@ -55,7 +55,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", ")\n", @@ -105,7 +105,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=dict_sphere,\n", + " fun=dict_sphere,\n", " params={\"a\": 0, \"b\": 1, \"c\": pd.Series([2, 3, 4])},\n", " algorithm=\"scipy_powell\",\n", ")\n", @@ -152,7 +152,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=dict_sphere,\n", + " fun=dict_sphere,\n", " params={\"a\": 0, \"b\": 1, \"c\": pd.Series([2, 3, 4])},\n", " algorithm=\"scipy_neldermead\",\n", ")\n", @@ -173,7 +173,7 @@ "outputs": [ { "data": { - 
"image/png": "" + "image/png": "" }, "metadata": {}, "output_type": "display_data" @@ -191,7 +191,7 @@ "outputs": [ { "data": { - "image/png": "" + "image/png": "" }, "metadata": {}, "output_type": "display_data" @@ -247,7 +247,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " lower_bounds=np.arange(5) - 2,\n", @@ -282,7 +282,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " constraints=[{\"loc\": [1, 3], \"type\": \"fixed\"}],\n", @@ -308,7 +308,7 @@ { "data": { "text/plain": [ - "array([ 0.33334, 0.33333, 0.33333, -0. , 0. ])" + "array([ 0.33333, 0.33333, 0.33334, -0. , 0. ])" ] }, "execution_count": 11, @@ -318,7 +318,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.array([0.1, 0.5, 0.4, 4, 5]),\n", " algorithm=\"scipy_lbfgsb\",\n", " constraints=[{\"loc\": [0, 1, 2], \"type\": \"probability\"}],\n", @@ -363,7 +363,7 @@ { "data": { "text/plain": [ - "array([ 0., -0., -0., 0., -0.])" + "array([ 0., -0., -0., 0., 0.])" ] }, "execution_count": 13, @@ -373,7 +373,7 @@ ], "source": [ "res = om.maximize(\n", - " criterion=upside_down_sphere,\n", + " fun=upside_down_sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_bfgs\",\n", ")\n", @@ -410,6 +410,16 @@ "execution_count": 15, "metadata": {}, "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/janosgabler/Dropbox/Projects/optimagic/src/optimagic/deprecations.py:29: FutureWarning:\n", + "\n", + "To align optimagic with scipy.optimize, the `derivative` argument has been renamed to `jac`. Please use `jac` instead of `derivative`. 
Using `derivative` will become an error in optimagic version 0.6.0 and later.\n", + "\n" + ] + }, { "data": { "text/plain": [ @@ -423,7 +433,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " derivative=sphere_gradient,\n", @@ -456,7 +466,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " numdiff_options={\"n_cores\": 6},\n", @@ -490,7 +500,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(10),\n", " algorithm=\"scipy_neldermead\",\n", " soft_lower_bounds=np.full(10, -5),\n", @@ -515,7 +525,7 @@ "outputs": [ { "data": { - "image/png": "" + "image/png": "" }, "metadata": {}, "output_type": "display_data" @@ -565,7 +575,7 @@ { "data": { "text/plain": [ - "array([ 0., 0., -0., 0., -0.])" + "array([-0., 0., 0., 0., -0.])" ] }, "execution_count": 20, @@ -575,7 +585,7 @@ ], "source": [ "res = om.minimize(\n", - " criterion=general_sphere,\n", + " fun=general_sphere,\n", " params=np.arange(5),\n", " algorithm=\"pounders\",\n", ")\n", @@ -598,7 +608,7 @@ "outputs": [], "source": [ "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " logging=\"my_log.db\",\n", @@ -670,12 +680,12 @@ ], "source": [ "algo_options = {\n", - " \"convergence.relative_criterion_tolerance\": 1e-9,\n", - " \"stopping.max_iterations\": 100_000,\n", + " \"convergence.ftol_rel\": 1e-9,\n", + " \"stopping.maxiter\": 100_000,\n", "}\n", "\n", "res = om.minimize(\n", - " criterion=sphere,\n", + " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", " algo_options=algo_options,\n", @@ -700,7 +710,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.8" + "version": "3.10.14" }, "vscode": { 
"interpreter": { From da09eba28ce55d6ee896a99a7d25a8ee82fa48f1 Mon Sep 17 00:00:00 2001 From: Janos Gabler Date: Fri, 19 Jul 2024 17:08:48 +0200 Subject: [PATCH 25/25] Fix warning in notebook. --- docs/source/tutorials/optimization_overview.ipynb | 12 +----------- 1 file changed, 1 insertion(+), 11 deletions(-) diff --git a/docs/source/tutorials/optimization_overview.ipynb b/docs/source/tutorials/optimization_overview.ipynb index 58b53ba3f..51a4a4b66 100644 --- a/docs/source/tutorials/optimization_overview.ipynb +++ b/docs/source/tutorials/optimization_overview.ipynb @@ -410,16 +410,6 @@ "execution_count": 15, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/Users/janosgabler/Dropbox/Projects/optimagic/src/optimagic/deprecations.py:29: FutureWarning:\n", - "\n", - "To align optimagic with scipy.optimize, the `derivative` argument has been renamed to `jac`. Please use `jac` instead of `derivative`. Using `derivative` will become an error in optimagic version 0.6.0 and later.\n", - "\n" - ] - }, { "data": { "text/plain": [ @@ -436,7 +426,7 @@ " fun=sphere,\n", " params=np.arange(5),\n", " algorithm=\"scipy_lbfgsb\",\n", - " derivative=sphere_gradient,\n", + " jac=sphere_gradient,\n", ")\n", "res.params.round(5)" ]