Create InSampleEffectsPlot (#2809)
Summary:
Pull Request resolved: #2809

In-sample effects will be divided by name into modeled and raw. They will use the model from the generation strategy (GS) when applicable and possible, and otherwise fall back to a Thompson sampling (TS) model.
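
For example, a minimal sketch of how the new plot can be invoked (the experiment, generation strategy, and metric name below are placeholders):

    from ax.analysis.plotly.arm_effects import InSampleEffectsPlot

    # Modeled effects: uses the generation strategy's model when it is predictive,
    # otherwise falls back to an empirical Bayes Thompson model fit to the trial data.
    modeled_card = InSampleEffectsPlot(
        metric_name="some_metric", trial_index=0, use_modeled_effects=True
    ).compute(experiment=experiment, generation_strategy=generation_strategy)

    # Raw effects: uses a Thompson model that simply reproduces the observed data.
    raw_card = InSampleEffectsPlot(
        metric_name="some_metric", trial_index=0, use_modeled_effects=False
    ).compute(experiment=experiment)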

TODO in a follow-up: attach the data start and end times to the tooltip.

Reviewed By: mpolson64

Differential Revision: D63765113

fbshipit-source-id: d8ddac2ccd12a81f8c603fac9caad32a190fc644
Daniel Cohen authored and facebook-github-bot committed Oct 5, 2024
1 parent 71c68ee commit f0ac920
Showing 8 changed files with 1,070 additions and 152 deletions.
9 changes: 9 additions & 0 deletions ax/analysis/plotly/arm_effects/__init__.py
@@ -0,0 +1,9 @@
# Copyright (c) Meta Platforms, Inc. and affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

from ax.analysis.plotly.arm_effects.insample_effects import InSampleEffectsPlot
from ax.analysis.plotly.arm_effects.predicted_effects import PredictedEffectsPlot

__all__ = ["PredictedEffectsPlot", "InSampleEffectsPlot"]
288 changes: 288 additions & 0 deletions ax/analysis/plotly/arm_effects/insample_effects.py
@@ -0,0 +1,288 @@
# Copyright (c) Meta Platforms, Inc. and affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

from itertools import chain
from logging import Logger

import pandas as pd
from ax.analysis.analysis import AnalysisCardLevel
from ax.analysis.plotly.arm_effects.utils import (
    get_predictions_by_arm,
    prepare_arm_effects_plot,
)

from ax.analysis.plotly.plotly_analysis import PlotlyAnalysis, PlotlyAnalysisCard
from ax.analysis.plotly.utils import is_predictive
from ax.core.experiment import Experiment
from ax.core.generation_strategy_interface import GenerationStrategyInterface
from ax.core.generator_run import GeneratorRun
from ax.core.outcome_constraint import OutcomeConstraint
from ax.exceptions.core import DataRequiredError, UserInputError
from ax.modelbridge.base import ModelBridge
from ax.modelbridge.generation_strategy import GenerationStrategy
from ax.modelbridge.registry import Models
from ax.modelbridge.transforms.derelativize import Derelativize
from ax.utils.common.logger import get_logger
from plotly import io as pio
from pyre_extensions import none_throws

logger: Logger = get_logger(__name__)


class InSampleEffectsPlot(PlotlyAnalysis):
    """
    Plotly in-sample effects plot for a single metric on a single trial, with one
    point per unique arm on that trial. The plot may either use modeled effects or
    raw / observed data.
    This plot is useful for understanding how arms compare to each other for a given
    metric.
    TODO: Allow trial index to be optional so we can plot all trials for non-batch
    experiments.
    The DataFrame computed will contain one row per arm and the following columns:
        - source: In-sample or model key that generated the candidate
        - arm_name: The name of the arm
        - mean: The observed or predicted mean of the metric specified
        - sem: The observed or predicted sem of the metric specified
        - error_margin: The 95% CI of the metric specified for the arm
        - size_column: The size of the circle in the plot, which represents
          the probability that the arm is feasible (does not violate any
          constraints).
        - parameters: A string representation of the parameters for the arm
          to be viewed in the tooltip.
        - constraints_violated: A string representation of the probability
          each constraint is violated for the arm, to be viewed in the tooltip.
    """

    def __init__(
        self, metric_name: str, trial_index: int, use_modeled_effects: bool
    ) -> None:
        """
        Args:
            metric_name: The name of the metric to plot.
            trial_index: The index of the trial to plot arms for.
            use_modeled_effects: Whether to use modeled effects or show
                raw effects.
        """

        self.metric_name = metric_name
        self.trial_index = trial_index
        self.use_modeled_effects = use_modeled_effects

    def compute(
        self,
        experiment: Experiment | None = None,
        generation_strategy: GenerationStrategyInterface | None = None,
    ) -> PlotlyAnalysisCard:
        if experiment is None:
            raise UserInputError("InSampleEffectsPlot requires an Experiment.")

        model = _get_model(
            experiment=experiment,
            generation_strategy=generation_strategy,
            use_modeled_effects=self.use_modeled_effects,
            trial_index=self.trial_index,
            metric_name=self.metric_name,
        )

        outcome_constraints = (
            []
            if experiment.optimization_config is None
            else Derelativize()
            .transform_optimization_config(
                # TODO[T203521207]: move cloning into transform_optimization_config
                optimization_config=none_throws(experiment.optimization_config).clone(),
                modelbridge=model,
            )
            .outcome_constraints
        )
        df = _prepare_data(
            experiment=experiment,
            model=model,
            outcome_constraints=outcome_constraints,
            metric_name=self.metric_name,
            trial_index=self.trial_index,
            use_modeled_effects=self.use_modeled_effects,
        )
        fig = prepare_arm_effects_plot(
            df=df, metric_name=self.metric_name, outcome_constraints=outcome_constraints
        )

        if (
            experiment.optimization_config is None
            or self.metric_name not in experiment.optimization_config.metrics
        ):
            level = AnalysisCardLevel.LOW
        elif self.metric_name in experiment.optimization_config.objective.metric_names:
            level = AnalysisCardLevel.HIGH
        else:
            level = AnalysisCardLevel.MID

        plot_type = "Modeled" if self.use_modeled_effects else "Raw"
        subtitle = (
            "View a trial and its arms' "
            f"{'predicted' if self.use_modeled_effects else 'observed'} "
            "metric values"
        )
        return PlotlyAnalysisCard(
            name=f"{plot_type}EffectsPlot",
            title=(
                f"{plot_type} Effects for {self.metric_name} "
                f"on trial {self.trial_index}"
            ),
            subtitle=subtitle,
            level=level,
            df=df,
            blob=pio.to_json(fig),
            attributes={"trial_index": self.trial_index},
        )


def _get_max_observed_trial_index(model: ModelBridge) -> int | None:
    """Returns the max observed trial index to appease multitask models for prediction
    by giving fixed features. This is not necessarily accurate and should eventually
    come from the generation strategy.
    """
    observed_trial_indices = [
        obs.features.trial_index
        for obs in model.get_training_data()
        if obs.features.trial_index is not None
    ]
    if len(observed_trial_indices) == 0:
        return None
    return max(observed_trial_indices)


def _get_model(
    experiment: Experiment,
    generation_strategy: GenerationStrategyInterface | None,
    use_modeled_effects: bool,
    trial_index: int,
    metric_name: str,
) -> ModelBridge:
    """Get a model for predictions.
    Args:
        experiment: Used to get the data for the model.
        generation_strategy: Used to get the model if we want to use modeled effects
            and the current model is predictive.
        use_modeled_effects: Whether to use modeled effects.
        trial_index: The trial index to get data for in training the model.
        metric_name: The name of the metric we're plotting, which we validate has
            data on the trial.
    Returns:
        If use_modeled_effects is False, returns a Thompson model, which just predicts
        from the data.
        If use_modeled_effects is True, returns the current model on the generation
        strategy if it is predictive. Otherwise, returns an empirical Bayes model.
    """
    trial_data = experiment.lookup_data(trial_indices=[trial_index])
    if trial_data.filter(metric_names=[metric_name]).df.empty:
        raise DataRequiredError(
            f"Cannot plot effects for '{metric_name}' on trial {trial_index} "
            "because it has no data. Either the data is not available yet, "
            "or we encountered an error fetching it."
        )
    if use_modeled_effects:
        model = None
        if isinstance(generation_strategy, GenerationStrategy):
            if generation_strategy.model is None:
                generation_strategy._fit_current_model(data=experiment.lookup_data())

            model = none_throws(generation_strategy.model)

        if model is None or not is_predictive(model=model):
            logger.info("Using empirical Bayes for predictions.")
            return Models.EMPIRICAL_BAYES_THOMPSON(
                experiment=experiment, data=trial_data
            )

        return model
    else:
        # This model just predicts raw data
        return Models.THOMPSON(
            data=trial_data,
            search_space=experiment.search_space,
            experiment=experiment,
        )


def _prepare_data(
    experiment: Experiment,
    model: ModelBridge,
    outcome_constraints: list[OutcomeConstraint],
    metric_name: str,
    trial_index: int,
    use_modeled_effects: bool,
) -> pd.DataFrame:
    """Prepare data for plotting. Data should include columns for:
        - source: In-sample or model key that generated the candidate
        - arm_name: Name of the arm
        - mean: Predicted metric value
        - error_margin: 1.96 * predicted sem for plotting 95% CI
        - **PARAMETER_NAME: The value of each parameter for the arm. Will be used
          for the tooltip.
    There will be one row for each arm in the trial's generator runs, plus one for
    the status quo if the experiment has one. If an arm appears in more than one
    generator run, it will only appear once.
    Args:
        experiment: Experiment to plot
        model: ModelBridge being used for prediction
        outcome_constraints: Derelativized outcome constraints used for
            assessing feasibility
        metric_name: Name of metric to plot
        trial_index: Index of the trial to plot
        use_modeled_effects: Whether modeled or raw effects are plotted
    """
    try:
        trial = experiment.trials[trial_index]
    except KeyError:
        raise UserInputError(
            f"Cannot plot effects for {trial_index} because "
            f"it's missing from {experiment}."
        )

    status_quo_prediction = (
        []
        if experiment.status_quo is None
        else [
            get_predictions_by_arm(
                model=model,
                metric_name=metric_name,
                outcome_constraints=outcome_constraints,
                gr=GeneratorRun(
                    arms=[experiment.status_quo],
                    model_key="Status Quo",
                ),
            )
        ]
    )
    trial_predictions = [
        get_predictions_by_arm(
            model=model,
            metric_name=metric_name,
            outcome_constraints=outcome_constraints,
            gr=gr,
        )
        for gr in trial.generator_runs
    ]

    df = pd.DataFrame.from_records(
        list(
            chain(
                *[
                    *trial_predictions,
                    *status_quo_prediction,
                ]
            )
        )
    )
    df.drop_duplicates(subset="arm_name", keep="last", inplace=True)
    return df