Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add pounders filtering to tranquilo #389

Merged
merged 36 commits into from
Oct 30, 2022
Merged
Show file tree
Hide file tree
Changes from 34 commits
Commits
Show all changes
36 commits
Select commit Hold shift + click to select a range
23132f6
Make tranquilo more flexible and fix bug in pounders fitting.
segsell Oct 12, 2022
8bbfc54
Add more tests and fix bug.
segsell Oct 12, 2022
c9700c6
Merge branch 'main' into filtering
segsell Oct 12, 2022
f3f2bad
Add pounders filtering.
segsell Oct 17, 2022
5ef749a
Merge branch 'main' into filtering
segsell Oct 17, 2022
8e1bd64
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Oct 17, 2022
468adbf
Refactor.
segsell Oct 18, 2022
14b7f4d
Rename variables.
segsell Oct 18, 2022
8d9cb71
Add test on linear aggregator.
segsell Oct 19, 2022
1e4ddd3
More tests and fix.
segsell Oct 20, 2022
0648621
Add original pounders fitting.
segsell Oct 21, 2022
9fd2022
Improve fitting.
segsell Oct 21, 2022
5675012
Rename to experimental pounders fitting and add more unit tests.
segsell Oct 22, 2022
080c1cf
Split integration test up into proper, imprecise, and problematic def…
segsell Oct 22, 2022
cd6ba76
Add unit test.
segsell Oct 22, 2022
dcf48a1
Add original pounders fitting.
segsell Oct 22, 2022
5dbee38
Adjust integration tests.
segsell Oct 22, 2022
59c6295
Flag problematic tests failing on other systems.
segsell Oct 22, 2022
f04ade2
[pre-commit.ci] pre-commit autoupdate (#387)
pre-commit-ci[bot] Oct 29, 2022
a3a3f1c
Fix CI?
janosg Oct 29, 2022
a64b0a3
Fix CI?
janosg Oct 29, 2022
cc84d61
Undo.
janosg Oct 29, 2022
dcfca36
Fix CI?
janosg Oct 29, 2022
d97e64d
Fix CI?
janosg Oct 29, 2022
a86f928
Fix CI?
janosg Oct 29, 2022
438be6f
Fix CI?
janosg Oct 29, 2022
ea568a2
Clean up handling of default and user options.
janosg Oct 30, 2022
8edbddc
Merge the two identity aggregators.
janosg Oct 30, 2022
55073e7
Remove fit_pounders_original.
janosg Oct 30, 2022
6bd8998
Remove tests for scalar tranquilo with linear surrogate.
janosg Oct 30, 2022
2bba26e
Improve former flexibel fit and rename to fit_powell.
janosg Oct 30, 2022
8ebbccc
Remove ability to fit models without intercept.
janosg Oct 30, 2022
e2ddcfd
Use intercepts in identity aggregator.
janosg Oct 30, 2022
ce931b7
Remove leftovers from models without intercepts.
janosg Oct 30, 2022
c2394ad
Hardcode aggregator for now.
janosg Oct 30, 2022
74aa852
More function calls with keyword arguments, remove code branches that…
janosg Oct 30, 2022
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 3 additions & 3 deletions .pre-commit-config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,7 @@ repos:
- id: debug-statements
- id: end-of-file-fixer
- repo: https://github.com/asottile/reorder_python_imports
rev: v3.8.3
rev: v3.8.5
hooks:
- id: reorder-python-imports
types: [python]
Expand Down Expand Up @@ -47,7 +47,7 @@ repos:
additional_dependencies: [black==22.3.0]
exclude: docs/source/how_to_guides/optimization/how_to_specify_constraints.md
- repo: https://github.com/psf/black
rev: 22.8.0
rev: 22.10.0
hooks:
- id: black
language_version: python3.9
Expand All @@ -72,7 +72,7 @@ repos:
- id: check-useless-excludes
# - id: identity # Prints all files passed to pre-commits. Debugging.
- repo: https://github.com/nbQA-dev/nbQA
rev: 1.5.2
rev: 1.5.3
hooks:
- id: nbqa-black
additional_dependencies: [black==22.3.0]
Expand Down
2 changes: 1 addition & 1 deletion src/estimagic/benchmarking/process_benchmark_results.py
Original file line number Diff line number Diff line change
Expand Up @@ -167,7 +167,7 @@ def _make_history_monotone(df, target_col, direction="minimize"):

"""
sorted_df = df.sort_values(["problem", "algorithm", "n_evaluations"])
grouped = sorted_df.groupby(["problem", "algorithm"])[target_col]
grouped = sorted_df.groupby(["problem", "algorithm"], group_keys=False)[target_col]

if direction == "minimize":
out = grouped.apply(np.minimum.accumulate)
Expand Down
32 changes: 12 additions & 20 deletions src/estimagic/optimization/tranquilo/aggregate_models.py
Original file line number Diff line number Diff line change
Expand Up @@ -46,7 +46,7 @@ def get_aggregator(aggregator, functype, model_info):

# determine if aggregator is compatible with functype and model_info
aggregator_compatible_with_functype = {
"scalar": ("identity", "sum"),
"scalar": ("identity", "identity_old", "sum"),
"least_squares": ("least_squares_linear",),
"likelihood": (
"sum",
Expand All @@ -57,13 +57,14 @@ def get_aggregator(aggregator, functype, model_info):
aggregator_compatible_with_model_info = {
# keys are names of aggregators and values are functions of model_info that
# return False in case of incompatibility
"identity": _is_second_order_model,
"identity": lambda x: True,
"sum": _is_second_order_model,
"information_equality_linear": lambda model_info: not _is_second_order_model(
model_info
),
"least_squares_linear": lambda model_info: model_info.has_intercepts
and not _is_second_order_model(model_info),
"least_squares_linear": lambda model_info: not _is_second_order_model(
model_info
),
}

if _using_built_in_aggregator:
Expand All @@ -73,11 +74,6 @@ def get_aggregator(aggregator, functype, model_info):
f"Aggregator {_aggregator_name} is not compatible with functype "
f"{functype}. It would not produce a quadratic main model."
)
if functype == "scalar" and not _is_second_order_model(model_info):
raise ValueError(
f"ModelInfo {model_info} is not compatible with functype scalar. "
"It would not produce a quadratic main model."
)
if not aggregator_compatible_with_model_info[_aggregator_name](model_info):
raise ValueError(
f"ModelInfo {model_info} is not compatible with aggregator "
Expand Down Expand Up @@ -137,9 +133,12 @@ def aggregator_identity(vector_model, fvec_center, model_info):
2. ModelInfo: has squares or interactions

"""
intercept = float(fvec_center)
intercept = float(vector_model.intercepts)
linear_terms = np.squeeze(vector_model.linear_terms)
square_terms = np.squeeze(vector_model.square_terms)
if model_info.has_squares or model_info.has_interactions:
square_terms = np.squeeze(vector_model.square_terms)
else:
square_terms = np.zeros((len(linear_terms), len(linear_terms)))
return intercept, linear_terms, square_terms


Expand All @@ -157,11 +156,7 @@ def aggregator_sum(vector_model, fvec_center, model_info):
2. ModelInfo: has squares or interactions

"""
if model_info.has_intercepts:
vm_intercepts = vector_model.intercepts
else:
vm_intercepts = fvec_center

vm_intercepts = vector_model.intercepts
intercept = vm_intercepts.sum(axis=0)
linear_terms = vector_model.linear_terms.sum(axis=0)
square_terms = vector_model.square_terms.sum(axis=0)
Expand Down Expand Up @@ -210,10 +205,7 @@ def aggregator_information_equality_linear(vector_model, fvec_center, model_info

"""
vm_linear_terms = vector_model.linear_terms
if model_info.has_intercepts:
vm_intercepts = vector_model.intercepts
else:
vm_intercepts = fvec_center
vm_intercepts = vector_model.intercepts

fisher_information = vm_linear_terms.T @ vm_linear_terms

Expand Down
130 changes: 124 additions & 6 deletions src/estimagic/optimization/tranquilo/filter_points.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,6 @@
import numpy as np
from numba import njit
from scipy.linalg import qr_multiply


def get_sample_filter(sample_filter="keep_all"):
Expand All @@ -18,9 +20,10 @@ def get_sample_filter(sample_filter="keep_all"):

"""
built_in_filters = {
"discard_all": _discard_all,
"keep_all": _keep_all,
"drop_collinear": _drop_collinear,
"discard_all": discard_all,
"keep_all": keep_all,
"drop_collinear": drop_collinear,
"drop_pounders": drop_collinear_pounders,
}

if isinstance(sample_filter, str) and sample_filter in built_in_filters:
Expand All @@ -33,14 +36,129 @@ def get_sample_filter(sample_filter="keep_all"):
return out


def _discard_all(xs, indices, state):
def discard_all(xs, indices, state):
return state.x.reshape(1, -1), np.array([state.index])


def _keep_all(xs, indices, state):
def keep_all(xs, indices, state):
return xs, indices


def _drop_collinear(xs, indices, state):
def drop_collinear(xs, indices, state):
"""Make sure that the points that are kept are linearly independent."""
raise NotImplementedError()


def drop_collinear_pounders(xs, indices, state):
"""Drop collinear points using pounders filtering."""
if xs.shape[0] <= xs.shape[1] + 1:
filtered_xs, filtered_indices = xs, indices
else:
filtered_xs, filtered_indices = _drop_collinear_pounders(xs, indices, state)

return filtered_xs, filtered_indices


def _drop_collinear_pounders(xs, indices, state):
theta2 = 1e-4
n_samples, n_params = xs.shape
n_poly_terms = n_params * (n_params + 1) // 2

indices_reverse = indices[::-1]
indexer_reverse = np.arange(n_samples)[::-1]

radius = state.radius
center = state.x
index_center = int(np.where(indices_reverse == state.index)[0])
centered_xs = (xs - center) / radius

(
linear_features,
square_features,
idx_list_n_plus_1,
index,
) = _get_polynomial_feature_matrices(
centered_xs,
indexer_reverse,
index_center,
n_params,
n_samples,
n_poly_terms,
)

indexer_filtered = indexer_reverse[idx_list_n_plus_1].tolist()
_index_center = indexer_reverse[index_center]

counter = n_params + 1

while (counter < n_samples) and (index >= 0):
if index == _index_center:
index -= 1
continue

linear_features[counter, 1:] = centered_xs[index]
square_features[counter, :] = _square_features(linear_features[counter, 1:])

linear_features_pad = np.zeros((n_samples, n_samples))
linear_features_pad[:n_samples, : n_params + 1] = linear_features

n_z_mat, _ = qr_multiply(
linear_features_pad[: counter + 1, :],
square_features.T[:n_poly_terms, : counter + 1],
)
beta = np.linalg.svd(n_z_mat.T[n_params + 1 :], compute_uv=False)

if beta[min(counter - n_params, n_poly_terms) - 1] > theta2:
indexer_filtered += [index]
counter += 1

index -= 1

filtered_indices = indices[indexer_filtered]
filtered_xs = xs[indexer_filtered]

return filtered_xs, filtered_indices


def _get_polynomial_feature_matrices(
centered_xs, indexer, index_center, n_params, n_samples, n_poly_terms
):
linear_features = np.zeros((n_samples, n_params + 1))
square_features = np.zeros((n_samples, n_poly_terms))

linear_features[0, 1:] = centered_xs[indexer[index_center]]
square_features[0, :] = _square_features(linear_features[0, 1:]).flatten()

_is_center_in_head = index_center < n_params
idx_list_n = [i for i in range(n_params + _is_center_in_head) if i != index_center]
idx_list_n_plus_1 = [index_center] + idx_list_n

linear_features[:, 0] = 1
linear_features[: n_params + 1, 1:] = centered_xs[indexer[idx_list_n_plus_1]]
square_features[: n_params + 1, :] = _square_features(
linear_features[: n_params + 1, 1:]
)

idx = n_samples - _is_center_in_head - len(idx_list_n) - 1

return linear_features, square_features, idx_list_n_plus_1, idx


@njit
def _square_features(x):
n_samples, n_params = np.atleast_2d(x).shape
n_poly_terms = n_params * (n_params + 1) // 2

poly_terms = np.empty((n_poly_terms, n_samples), x.dtype)
xt = x.T

idx = 0
for i in range(n_params):
poly_terms[idx] = 0.5 * xt[i] ** 2
idx += 1

for j in range(i + 1, n_params):
poly_terms[idx] = xt[i] * xt[j] / np.sqrt(2)
idx += 1

return poly_terms.T
Loading