Source code for ax.modelbridge.generation_strategy

#!/usr/bin/env python3
# Copyright (c) Meta Platforms, Inc. and affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

# pyre-strict

from __future__ import annotations

from collections.abc import Callable

from copy import deepcopy
from functools import wraps
from logging import Logger
from typing import Any, TypeVar

import pandas as pd
from ax.core.data import Data
from ax.core.experiment import Experiment
from ax.core.generation_strategy_interface import GenerationStrategyInterface
from ax.core.generator_run import GeneratorRun
from ax.core.observation import ObservationFeatures
from ax.core.utils import extend_pending_observations, extract_pending_observations
from ax.exceptions.core import DataRequiredError, UnsupportedError, UserInputError
from ax.exceptions.generation_strategy import (
    GenerationStrategyCompleted,
    GenerationStrategyMisconfiguredException,
)
from ax.modelbridge.base import ModelBridge
from ax.modelbridge.generation_node import GenerationNode, GenerationStep
from ax.modelbridge.generation_node_input_constructors import InputConstructorPurpose
from ax.modelbridge.model_spec import FactoryFunctionModelSpec
from ax.modelbridge.transition_criterion import TrialBasedCriterion
from ax.utils.common.logger import _round_floats_for_logging, get_logger
from ax.utils.common.typeutils import checked_cast_list
from pyre_extensions import none_throws

logger: Logger = get_logger(__name__)


MAX_CONDITIONS_GENERATED = 10000
MAX_GEN_DRAWS = 5
MAX_GEN_DRAWS_EXCEEDED_MESSAGE = (
    f"GenerationStrategy exceeded `MAX_GEN_DRAWS` of {MAX_GEN_DRAWS} while trying to "
    "generate a unique parameterization. This indicates that the search space has "
    "likely been fully explored, or that the sweep has converged."
)
T = TypeVar("T")



[docs]
def step_based_gs_only(f: Callable[..., T]) -> Callable[..., T]:
    """
    For use as a decorator on functions only implemented for ``GenerationStep``-based
    ``GenerationStrategies``. Mainly useful for older ``GenerationStrategies``.
    """

    @wraps(f)
    def impl(self: GenerationStrategy, *args: list[Any], **kwargs: dict[str, Any]) -> T:
        if self.is_node_based:
            raise UnsupportedError(
                f"{f.__name__} is not supported for GenerationNode based"
                " GenerationStrategies."
            )
        return f(self, *args, **kwargs)

    return impl




[docs]
class GenerationStrategy(GenerationStrategyInterface):
    """GenerationStrategy describes which model should be used to generate new
    points for which trials, enabling and automating use of different models
    throughout the optimization process. For instance, it allows to use one
    model for the initialization trials, and another one for all subsequent
    trials. In the general case, this allows to automate use of an arbitrary
    number of models to generate an arbitrary numbers of trials
    described in the `trials_per_model` argument.

    Args:
        nodes: A list of `GenerationNode`. Each `GenerationNode` in the list
            represents a single node in a `GenerationStrategy` which, when
            composed of `GenerationNodes`, can be conceptualized as a graph instead
            of a linear list. `TransitionCriterion` defined in each `GenerationNode`
            represent the edges in the `GenerationStrategy` graph. `GenerationNodes`
            are more flexible than `GenerationSteps` and new `GenerationStrategies`
            should use nodes. Notably, either, but not both, of `nodes` and `steps`
            must be provided.
        steps: A list of `GenerationStep` describing steps of this strategy.
        name: An optional name for this generation strategy. If not specified,
            strategy's name will be names of its nodes' models joined with '+'.
    """

    _nodes: list[GenerationNode]
    _curr: GenerationNode  # Current node in the strategy.
    # Whether all models in this GS are in Models registry enum.
    _uses_registered_models: bool
    # All generator runs created through this generation strategy, in chronological
    # order.
    _generator_runs: list[GeneratorRun]
    # Experiment, for which this generation strategy has generated trials, if
    # it exists.
    _experiment: Experiment | None = None
    _model: ModelBridge | None = None  # Current model.

    def __init__(
        self,
        steps: list[GenerationStep] | None = None,
        name: str | None = None,
        nodes: list[GenerationNode] | None = None,
    ) -> None:
        # Validate that one and only one of steps or nodes is provided
        if not ((steps is None) ^ (nodes is None)):
            raise GenerationStrategyMisconfiguredException(
                error_info="GenerationStrategy must contain either steps or nodes."
            )

        # pyre-ignore[8]
        self._nodes = none_throws(nodes if steps is None else steps)

        # Validate correctness of steps list or nodes graph
        if isinstance(steps, list) and all(
            isinstance(s, GenerationStep) for s in steps
        ):
            self._validate_and_set_step_sequence(steps=self._nodes)
        elif isinstance(nodes, list) and self.is_node_based:
            self._validate_and_set_node_graph(nodes=nodes)
        else:
            # TODO[mgarrard]: Allow mix of nodes and steps
            raise GenerationStrategyMisconfiguredException(
                "`GenerationStrategy` inputs are:\n"
                "`steps` (list of `GenerationStep`) or\n"
                "`nodes` (list of `GenerationNode`)."
            )

        # Log warning if the GS uses a non-registered (factory function) model.
        self._uses_registered_models = not any(
            isinstance(ms, FactoryFunctionModelSpec)
            for node in self._nodes
            for ms in node.model_specs
        )
        if not self._uses_registered_models:
            logger.info(
                "Using model via callable function, "
                "so optimization is not resumable if interrupted."
            )
        self._generator_runs = []
        # Set name to an explicit value ahead of time to avoid
        # adding properties during equality checks
        super().__init__(name=name or self._make_default_name())

    @property
    def is_node_based(self) -> bool:
        """Whether this strategy consists of GenerationNodes only.
        This is useful for determining initialization properties and
        other logic.
        """
        return not any(isinstance(n, GenerationStep) for n in self._nodes) and all(
            isinstance(n, GenerationNode) for n in self._nodes
        )

    @property
    def nodes_dict(self) -> dict[str, GenerationNode]:
        """Returns a dictionary mapping node names to nodes."""
        return {node.node_name: node for node in self._nodes}

    @property
    def name(self) -> str:
        """Name of this generation strategy. Defaults to a combination of model
        names provided in generation steps, set at the time of the
        ``GenerationStrategy`` creation.
        """
        return self._name

    @name.setter
    def name(self, name: str) -> None:
        """Set generation strategy name."""
        self._name = name

    @property
    @step_based_gs_only
    def model_transitions(self) -> list[int]:
        """[DEPRECATED]List of trial indices where a transition happened from one model
        to another.
        """
        raise DeprecationWarning(
            "`model_transitions` is no longer supported. Please refer to `model_key` "
            "field on generator runs for similar information if needed."
        )

    @property
    def current_step(self) -> GenerationStep:
        """Current generation step."""
        if not isinstance(self._curr, GenerationStep):
            raise TypeError(
                "The current object is not a GenerationStep, you may be looking "
                "for the current_node property."
            )
        return self._curr

    @property
    def current_node(self) -> GenerationNode:
        """Current generation node."""
        if not isinstance(self._curr, GenerationNode):
            raise TypeError(
                "The current object is not a GenerationNode, you may be looking for the"
                " current_step property."
            )
        return self._curr

    @property
    def current_node_name(self) -> str:
        """Current generation node name."""
        return self._curr.node_name

    @property
    @step_based_gs_only
    def current_step_index(self) -> int:
        """Returns the index of the current generation step. This attribute
        is replaced by node_name in newer GenerationStrategies but surfaced here
        for backward compatibility.
        """
        node_names_for_all_steps = [step._node_name for step in self._nodes]
        assert (
            self._curr.node_name in node_names_for_all_steps
        ), "The current step is not found in the list of steps"

        return node_names_for_all_steps.index(self._curr.node_name)

    @property
    def model(self) -> ModelBridge | None:
        """Current model in this strategy. Returns None if no model has been set
        yet (i.e., if no generator runs have been produced from this GS).
        """
        return self._curr._fitted_model

    @property
    def experiment(self) -> Experiment:
        """Experiment, currently set on this generation strategy."""
        if self._experiment is None:
            raise ValueError("No experiment set on generation strategy.")
        return none_throws(self._experiment)

    @experiment.setter
    def experiment(self, experiment: Experiment) -> None:
        """If there is an experiment set on this generation strategy as the
        experiment it has been generating generator runs for, check if the
        experiment passed in is the same as the one saved and log an information
        statement if its not. Set the new experiment on this generation strategy.
        """
        if self._experiment is None or experiment._name == self.experiment._name:
            self._experiment = experiment
        else:
            raise ValueError(
                "This generation strategy has been used for experiment "
                f"{self.experiment._name} so far; cannot reset experiment"
                f" to {experiment._name}. If this is a new optimization, "
                "a new generation strategy should be created instead."
            )

    @property
    def last_generator_run(self) -> GeneratorRun | None:
        """Latest generator run produced by this generation strategy.
        Returns None if no generator runs have been produced yet.
        """
        # Used to restore current model when decoding a serialized GS.
        return self._generator_runs[-1] if self._generator_runs else None

    @property
    def uses_non_registered_models(self) -> bool:
        """Whether this generation strategy involves models that are not
        registered and therefore cannot be stored."""
        return not self._uses_registered_models

    @property
    def trials_as_df(self) -> pd.DataFrame | None:
        """Puts information on individual trials into a data frame for easy
        viewing.

        For example for a GenerationStrategy composed of GenerationSteps:
        Gen. Step | Models   | Trial Index | Trial Status | Arm Parameterizations
        [0]       | [Sobol]  | 0           | RUNNING      | {"0_0":{"x":9.17...}}
        """
        logger.info(
            "Note that parameter values in dataframe are rounded to 2 decimal "
            "points; the values in the dataframe are thus not the exact ones "
            "suggested by Ax in trials."
        )
        if self._experiment is None or len(self.experiment.trials) == 0:
            return None

        step_or_node_col = (
            "Generation Nodes" if self.is_node_based else "Generation Step"
        )
        records = [
            {
                step_or_node_col: [
                    (
                        gr._generation_node_name
                        if gr.generator_run_type != "MANUAL"
                        else "MANUAL"
                    )
                    for gr in trial.generator_runs
                ],
                "Generation Model(s)": [
                    (gr._model_key if gr.generator_run_type != "MANUAL" else "MANUAL")
                    for gr in trial.generator_runs
                ],
                "Trial Index": trial_idx,
                "Trial Status": trial.status.name,
                "Arm Parameterizations": {
                    arm.name: _round_floats_for_logging(arm.parameters)
                    for arm in trial.arms
                },
            }
            for trial_idx, trial in self.experiment.trials.items()
        ]

        return pd.DataFrame.from_records(records).reindex(
            columns=[
                step_or_node_col,
                "Generation Model(s)",
                "Trial Index",
                "Trial Status",
                "Arm Parameterizations",
            ]
        )

    @property
    def optimization_complete(self) -> bool:
        """Checks whether all nodes are completed in the generation strategy."""
        return all(node.is_completed for node in self._nodes)

    @property
    @step_based_gs_only
    def _steps(self) -> list[GenerationStep]:
        """List of generation steps."""
        return self._nodes  # pyre-ignore[7]


[docs]
    def gen(
        self,
        experiment: Experiment,
        data: Data | None = None,
        n: int = 1,
        pending_observations: dict[str, list[ObservationFeatures]] | None = None,
        **kwargs: Any,
    ) -> GeneratorRun:
        """Produce the next points in the experiment. Additional kwargs passed to
        this method are propagated directly to the underlying model's `gen`, along
        with the `model_gen_kwargs` set on the current generation node.

        NOTE: Each generator run returned from this function must become a single
        trial on the experiment to comply with assumptions made in generation
        strategy. Do not split one generator run produced from generation strategy
        into multiple trials (never making a generator run into a trial is allowed).

        Args:
            experiment: Experiment, for which the generation strategy is producing
                a new generator run in the course of `gen`, and to which that
                generator run will be added as trial(s). Information stored on the
                experiment (e.g., trial statuses) is used to determine which model
                will be used to produce the generator run returned from this method.
            data: Optional data to be passed to the underlying model's `gen`, which
                is called within this method and actually produces the resulting
                generator run. By default, data is all data on the `experiment`.
            n: Integer representing how many arms should be in the generator run
                produced by this method. NOTE: Some underlying models may ignore
                the `n` and produce a model-determined number of arms. In that
                case this method will also output a generator run with number of
                arms that can differ from `n`.
            pending_observations: A map from metric name to pending
                observations for that metric, used by some models to avoid
                resuggesting points that are currently being evaluated.
        """
        return self._gen_multiple(
            experiment=experiment,
            num_generator_runs=1,
            data=data,
            n=n,
            pending_observations=pending_observations,
            **kwargs,
        )[0]



[docs]
    def gen_with_multiple_nodes(
        self,
        experiment: Experiment,
        data: Data | None = None,
        pending_observations: dict[str, list[ObservationFeatures]] | None = None,
        n: int | None = None,
        fixed_features: ObservationFeatures | None = None,
        arms_per_node: dict[str, int] | None = None,
    ) -> list[GeneratorRun]:
        """Produces a List of GeneratorRuns for a single trial, either ``Trial`` or
        ``BatchTrial``, and if producing a ``BatchTrial`` allows for multiple
        models to be used to generate GeneratorRuns for that trial.

        NOTE: This method is in development.  Please do not use it yet.

        Args:
            experiment: Experiment, for which the generation strategy is producing
                a new generator run in the course of `gen`, and to which that
                generator run will be added as trial(s). Information stored on the
                experiment (e.g., trial statuses) is used to determine which model
                will be used to produce the generator run returned from this method.
            data: Optional data to be passed to the underlying model's `gen`, which
                is called within this method and actually produces the resulting
                generator run. By default, data is all data on the `experiment`.
            pending_observations: A map from metric name to pending
                observations for that metric, used by some models to avoid
                resuggesting points that are currently being evaluated.
            n: Integer representing how many arms should be in the generator run
                produced by this method. NOTE: Some underlying models may ignore
                the `n` and produce a model-determined number of arms. In that
                case this method will also output a generator run with number of
                arms that can differ from `n`.
            fixed_features: An optional set of ``ObservationFeatures`` that will be
                passed down to the underlying models. Note: if provided this will
                override any algorithmically determined fixed features so it is
                important to specify all necessary fixed features.
            arms_per_node: An optional map from node name to the number of arms to
                generate from that node. If not provided, will default to the number
                of arms specified in the node's ``InputConstructors`` or n if no
                ``InputConstructors`` are defined on the node. We expect either n or
                arms_per_node to be provided, but not both, and this is an advanced
                argument that should only be used by advanced users.

        Returns:
            A list of ``GeneratorRuns`` for a single trial.
        """
        # TODO: @mgarrard merge into gen method, just starting here to derisk
        grs = []
        continue_gen_for_trial = True
        pending_observations = deepcopy(pending_observations) or {}
        self.experiment = experiment
        self._validate_arms_per_node(arms_per_node=arms_per_node)
        # TODO: @mgarrard update this when gen methods are merged
        gen_kwargs: dict[str, Any] = {}
        gen_kwargs = {
            "experiment": experiment,
            "data": data,
            "pending_observations": pending_observations,
            "grs_this_gen": grs,
            "n": n,
        }

        while continue_gen_for_trial:
            gen_kwargs["grs_this_gen"] = grs
            should_transition, node_to_gen_from_name = (
                self._curr.should_transition_to_next_node(
                    raise_data_required_error=False
                )
            )
            node_to_gen_from = self.nodes_dict[node_to_gen_from_name]
            if should_transition:
                node_to_gen_from._previous_node_name = node_to_gen_from_name
                # reset should skip as conditions may have changed, do not reset
                # until now so node properites can be as up to date as possible
                node_to_gen_from._should_skip = False
            arms_from_node = self._determine_arms_from_node(
                node_to_gen_from=node_to_gen_from,
                arms_per_node=arms_per_node,
                n=n,
                gen_kwargs=gen_kwargs,
            )
            fixed_features_from_node = self._determine_fixed_features_from_node(
                node_to_gen_from=node_to_gen_from,
                gen_kwargs=gen_kwargs,
                passed_fixed_features=fixed_features,
            )
            sq_ft_from_node = self._determine_sq_features_from_node(
                node_to_gen_from=node_to_gen_from, gen_kwargs=gen_kwargs
            )
            # TODO: @mgarrard clean this up after gens merge. This is currently needed
            # because the actual transition occurs in gs.gen(), but if a node is
            # skipped, we need to transition here to actually initiate that transition
            if node_to_gen_from._should_skip:
                self._maybe_transition_to_next_node()
                continue
            if arms_from_node != 0:
                grs.extend(
                    self._gen_multiple(
                        experiment=experiment,
                        num_generator_runs=1,
                        data=data,
                        n=arms_from_node,
                        pending_observations=pending_observations,
                        fixed_features=fixed_features_from_node,
                        status_quo_features=sq_ft_from_node,
                    )
                )
                # ensure that the points generated from each node are marked as pending
                # points for future calls to gen
                pending_observations = extend_pending_observations(
                    experiment=experiment,
                    pending_observations=pending_observations,
                    # only pass in the most recent generator run to avoid unnecessary
                    # deduplication in extend_pending_observations
                    generator_runs=[grs[-1]],
                )
            continue_gen_for_trial = self._should_continue_gen_for_trial()
        return grs



[docs]
    def gen_for_multiple_trials_with_multiple_models(
        self,
        experiment: Experiment,
        data: Data | None = None,
        pending_observations: dict[str, list[ObservationFeatures]] | None = None,
        n: int | None = None,
        fixed_features: ObservationFeatures | None = None,
        num_trials: int = 1,
        arms_per_node: dict[str, int] | None = None,
    ) -> list[list[GeneratorRun]]:
        """Produce GeneratorRuns for multiple trials at once with the possibility of
        using multiple models per trial, getting multiple GeneratorRuns per trial.

        Args:
            experiment: ``Experiment``, for which the generation strategy is producing
                a new generator run in the course of ``gen``, and to which that
                generator run will be added as trial(s). Information stored on the
                experiment (e.g., trial statuses) is used to determine which model
                will be used to produce the generator run returned from this method.
            data: Optional data to be passed to the underlying model's ``gen``, which
                is called within this method and actually produces the resulting
                generator run. By default, data is all data on the ``experiment``.
            pending_observations: A map from metric name to pending
                observations for that metric, used by some models to avoid
                resuggesting points that are currently being evaluated.
            n: Integer representing how many total arms should be in the generator
                runs produced by this method. NOTE: Some underlying models may ignore
                the `n` and produce a model-determined number of arms. In that
                case this method will also output generator runs with number of
                arms that can differ from `n`.
            fixed_features: An optional set of ``ObservationFeatures`` that will be
                passed down to the underlying models. Note: if provided this will
                override any algorithmically determined fixed features so it is
                important to specify all necessary fixed features.
            num_trials: Number of trials to generate generator runs for in this call.
                If not provided, defaults to 1.
            arms_per_node: An optional map from node name to the number of arms to
                generate from that node. If not provided, will default to the number
                of arms specified in the node's ``InputConstructors`` or n if no
                ``InputConstructors`` are defined on the node. We expect either n or
                arms_per_node to be provided, but not both, and this is an advanced
                argument that should only be used by advanced users.

        Returns:
            A list of lists of lists generator runs. Each outer list represents
            a trial being suggested and  each inner list represents a generator
            run for that trial.
        """
        trial_grs = []
        pending_observations = (
            extract_pending_observations(experiment=experiment) or {}
            if pending_observations is None
            else deepcopy(pending_observations)
        )
        gr_limit = self._curr.generator_run_limit(raise_generation_errors=False)
        if gr_limit == -1:
            num_trials = max(num_trials, 1)
        else:
            num_trials = max(min(num_trials, gr_limit), 1)
        for _i in range(num_trials):
            trial_grs.append(
                self.gen_with_multiple_nodes(
                    experiment=experiment,
                    data=data,
                    n=n,
                    pending_observations=pending_observations,
                    arms_per_node=arms_per_node,
                    fixed_features=fixed_features,
                )
            )

            extend_pending_observations(
                experiment=experiment,
                pending_observations=pending_observations,
                # pass in the most recently generated grs each time to avoid
                # duplication
                generator_runs=trial_grs[-1],
            )
        return trial_grs



[docs]
    def current_generator_run_limit(
        self,
    ) -> tuple[int, bool]:
        """First check if we can move the generation strategy to the next node, which
        is safe, as the next call to ``gen`` will just pick up from there. Then
        determine how many generator runs this generation strategy can generate right
        now, assuming each one of them becomes its own trial, and whether optimization
        is completed.

        Returns: a two-item tuple of:
              - the number of generator runs that can currently be produced, with -1
                meaning unlimited generator runs,
              - whether optimization is completed and the generation strategy cannot
                generate any more generator runs at all.
        """
        try:
            self._maybe_transition_to_next_node(raise_data_required_error=False)
        except GenerationStrategyCompleted:
            return 0, True

        # if the generation strategy is not complete, optimization is not complete
        return self._curr.generator_run_limit(), False



[docs]
    def clone_reset(self) -> GenerationStrategy:
        """Copy this generation strategy without it's state."""
        cloned_nodes = deepcopy(self._nodes)
        for n in cloned_nodes:
            # Unset the generation strategy back-pointer, so the nodes are not
            # associated with any generation strategy.
            n._generation_strategy = None
        if self.is_node_based:
            return GenerationStrategy(name=self.name, nodes=cloned_nodes)

        return GenerationStrategy(
            name=self.name, steps=checked_cast_list(GenerationStep, cloned_nodes)
        )


    def _unset_non_persistent_state_fields(self) -> None:
        """Utility for testing convenience: unset fields of generation strategy
        that are set during candidate generation; these fields are not persisted
        during storage. To compare a pre-storage and a reloaded generation
        strategies; call this utility on the pre-storage one first. The rest
        of the fields should be identical.
        """
        self._model = None
        for s in self._nodes:
            s._model_spec_to_gen_from = None
            if not self.is_node_based:
                s._previous_node_name = None

    @step_based_gs_only
    def _validate_and_set_step_sequence(self, steps: list[GenerationStep]) -> None:
        """Initialize and validate the steps provided to this GenerationStrategy.

        Some GenerationStrategies are composed of GenerationStep objects, but we also
        need to initialize the correct GenerationNode representation for these steps.
        This function validates:
            1. That only the last step has num_trials=-1, which indicates unlimited
               trial generation is possible.
            2. That each step's num_trials attribute is either positive or -1
            3. That each step's max_parallelism attribute is either None or positive
        It then sets the correct TransitionCriterion and node_name attributes on the
        underlying GenerationNode objects.
        """
        for idx, step in enumerate(steps):
            if step.num_trials == -1 and len(step.completion_criteria) < 1:
                if idx < len(self._steps) - 1:
                    raise UserInputError(
                        "Only last step in generation strategy can have "
                        "`num_trials` set to -1 to indicate that the model in "
                        "the step should be used to generate new trials "
                        "indefinitely unless completion criteria present."
                    )
            elif step.num_trials < 1 and step.num_trials != -1:
                raise UserInputError(
                    "`num_trials` must be positive or -1 (indicating unlimited) "
                    "for all generation steps."
                )
            if step.max_parallelism is not None and step.max_parallelism < 1:
                raise UserInputError(
                    "Maximum parallelism should be None (if no limit) or "
                    f"a positive number. Got: {step.max_parallelism} for "
                    f"step {step.model_name}."
                )

            step._node_name = f"GenerationStep_{str(idx)}"
            step.index = idx

            # Set transition_to field for all but the last step, which remains
            # null.
            if idx != len(self._steps):
                for transition_criteria in step.transition_criteria:
                    if (
                        transition_criteria.criterion_class
                        != "MaxGenerationParallelism"
                    ):
                        transition_criteria._transition_to = (
                            f"GenerationStep_{str(idx + 1)}"
                        )
            step._generation_strategy = self
        self._curr = steps[0]

    def _validate_and_set_node_graph(self, nodes: list[GenerationNode]) -> None:
        """Initialize and validate the node graph provided to this GenerationStrategy.

        This function validates:
            1. That all nodes have unique names.
            2. That there is at least one node with a transition_to field.
            3. That all `transition_to` attributes on a TransitionCriterion point to
                another node in the same GenerationStrategy.
            4. Warns if no nodes contain a transition criterion
        """
        node_names = []
        for node in self._nodes:
            # validate that all node names are unique
            if node.node_name in node_names:
                raise GenerationStrategyMisconfiguredException(
                    error_info="All node names in a GenerationStrategy "
                    + "must be unique."
                )

            node_names.append(node.node_name)
            node._generation_strategy = self

        # Validate that the next_node is in the ``GenerationStrategy`` and that all
        # TCs in one "transition edge" (so all TCs from one node to another) have the
        # same `continue_trial_generation` setting. Since multiple TCs together
        # constitute one "transition edge", not having all TCs on such an "edge"
        # indicate the same resulting state (continuing generation for same trial
        # vs. stopping it after generating from current node) would indicate a
        # malformed generation node DAG definition and therefore a
        # malformed ``GenerationStrategy``.
        contains_a_transition_to_argument = False
        for node in self._nodes:
            for next_node, tcs in node.transition_edges.items():
                contains_a_transition_to_argument = True
                if next_node is None:
                    # TODO: @mgarrard remove MaxGenerationParallelism check when
                    # we update TransitionCriterion always define `transition_to`
                    for tc in tcs:
                        if "MaxGenerationParallelism" not in tc.criterion_class:
                            raise GenerationStrategyMisconfiguredException(
                                error_info="Only MaxGenerationParallelism transition"
                                " criterion can have a null `transition_to` argument,"
                                f" but {tc.criterion_class} does not define "
                                f"`transition_to` on {node.node_name}."
                            )
                if next_node is not None and next_node not in node_names:
                    raise GenerationStrategyMisconfiguredException(
                        error_info=f"`transition_to` argument "
                        f"{next_node} does not correspond to any node in"
                        " this GenerationStrategy."
                    )
                if (
                    next_node is not None
                    and len({tc.continue_trial_generation for tc in tcs}) > 1
                ):
                    raise GenerationStrategyMisconfiguredException(
                        error_info=f"All transition criteria on an edge "
                        f"from node {node.node_name} to node {next_node} "
                        "should have the same `continue_trial_generation` "
                        "setting."
                    )

        # validate that at least one node has transition_to field
        if len(self._nodes) > 1 and not contains_a_transition_to_argument:
            logger.warning(
                "None of the nodes in this GenerationStrategy "
                "contain a `transition_to` argument in their transition_criteria. "
                "Therefore, the GenerationStrategy will not be able to "
                "move from one node to another. Please add a "
                "`transition_to` argument."
            )
        self._curr = nodes[0]

    @step_based_gs_only
    def _step_repr(self, step_str_rep: str) -> str:
        """Return the string representation of the steps in a GenerationStrategy
        composed of GenerationSteps.
        """
        step_str_rep += "steps=["
        remaining_trials = "subsequent" if len(self._nodes) > 1 else "all"
        for step in self._nodes:
            num_trials = remaining_trials
            for criterion in step.transition_criteria:
                if criterion.criterion_class == "MaxTrials" and isinstance(
                    criterion, TrialBasedCriterion
                ):
                    num_trials = criterion.threshold

            try:
                model_name = step.model_spec_to_gen_from.model_key
            except TypeError:
                model_name = "model with unknown name"

            step_str_rep += f"{model_name} for {num_trials} trials, "
        step_str_rep = step_str_rep[:-2]
        step_str_rep += "])"
        return step_str_rep

    def _validate_arms_per_node(self, arms_per_node: dict[str, int] | None) -> None:
        """Validate that the arms_per_node argument is valid if it is provided.

        Args:
            arms_per_node: A map from node name to the number of arms to
                generate from that node.
        """
        if arms_per_node is not None and not set(self.nodes_dict).issubset(
            arms_per_node
        ):
            raise UserInputError(
                f"""
                Each node defined in the GenerationStrategy must have an associated
                number of arms to generate from that node defined in `arms_per_node`.
                {arms_per_node} does not include all of {self.nodes_dict.keys()}. It
                may be helpful to double check the spelling.
                """
            )

    def _make_default_name(self) -> str:
        """Make a default name for this generation strategy; used when no name is passed
        to the constructor. For node-based generation strategies, the name is
        constructed by joining together the names of the nodes set on this
        generation strategy. For step-based generation strategies, the model keys
        of the underlying model specs are used.
        Note: This should only be called once the nodes are set.
        """
        if not self._nodes:
            raise UnsupportedError(
                "Cannot make a default name for a generation strategy with no nodes "
                "set yet."
            )
        # TODO: Simplify this after updating GStep names to represent underlying models.
        if self.is_node_based:
            node_names = (node.node_name for node in self._nodes)
        else:
            node_names = (node.model_spec_to_gen_from.model_key for node in self._nodes)
            # Trim the "get_" beginning of the factory function if it's there.
            node_names = (n[4:] if n[:4] == "get_" else n for n in node_names)
        return "+".join(node_names)

    def __repr__(self) -> str:
        """String representation of this generation strategy."""
        gs_str = f"GenerationStrategy(name='{self.name}', "
        if not self.is_node_based:
            return self._step_repr(gs_str)
        gs_str += f"nodes={str(self._nodes)})"
        return gs_str

    # ------------------------- Candidate generation helpers. -------------------------

    def _gen_multiple(
        self,
        experiment: Experiment,
        num_generator_runs: int,
        data: Data | None = None,
        n: int = 1,
        pending_observations: dict[str, list[ObservationFeatures]] | None = None,
        status_quo_features: ObservationFeatures | None = None,
        **model_gen_kwargs: Any,
    ) -> list[GeneratorRun]:
        """Produce multiple generator runs at once, to be made into multiple
        trials on the experiment.

        NOTE: This is used to ensure that maximum parallelism and number
        of trials per node are not violated when producing many generator
        runs from this generation strategy in a row. Without this function,
        if one generates multiple generator runs without first making any
        of them into running trials, generation strategy cannot enforce that it only
        produces as many generator runs as are allowed by the parallelism
        limit and the limit on number of trials in current node.

        Args:
            experiment: Experiment, for which the generation strategy is producing
                a new generator run in the course of `gen`, and to which that
                generator run will be added as trial(s). Information stored on the
                experiment (e.g., trial statuses) is used to determine which model
                will be used to produce the generator run returned from this method.
            data: Optional data to be passed to the underlying model's `gen`, which
                is called within this method and actually produces the resulting
                generator run. By default, data is all data on the `experiment`.
            n: Integer representing how many arms should be in the generator run
                produced by this method. NOTE: Some underlying models may ignore
                the ``n`` and produce a model-determined number of arms. In that
                case this method will also output a generator run with number of
                arms that can differ from ``n``.
            pending_observations: A map from metric name to pending
                observations for that metric, used by some models to avoid
                resuggesting points that are currently being evaluated.
            model_gen_kwargs: Keyword arguments that are passed through to
                ``GenerationNode.gen``, which will pass them through to
                ``ModelSpec.gen``, which will pass them to ``ModelBridge.gen``.
            status_quo_features: An ``ObservationFeature`` of the status quo arm,
                needed by some models during fit to accomadate relative constraints.
                Includes the status quo parameterization and target trial index.
        """
        self.experiment = experiment
        self._maybe_transition_to_next_node()
        self._fit_current_model(data=data, status_quo_features=status_quo_features)
        # Get GeneratorRun limit that respects the node's transition criterion that
        # affect the number of generator runs that can be produced.
        gr_limit = self._curr.generator_run_limit(raise_generation_errors=True)
        if gr_limit == -1:
            num_generator_runs = max(num_generator_runs, 1)
        else:
            num_generator_runs = max(min(num_generator_runs, gr_limit), 1)
        generator_runs = []
        pending_observations = deepcopy(pending_observations) or {}
        for _ in range(num_generator_runs):
            try:
                generator_run = self._curr.gen(
                    n=n,
                    pending_observations=pending_observations,
                    arms_by_signature_for_deduplication=(
                        experiment.arms_by_signature_for_deduplication
                    ),
                    **model_gen_kwargs,
                )

            except DataRequiredError as err:
                # Model needs more data, so we log the error and return
                # as many generator runs as we were able to produce, unless
                # no trials were produced at all (in which case its safe to raise).
                if len(generator_runs) == 0:
                    raise
                logger.debug(f"Model required more data: {err}.")
                break

            self._generator_runs.append(generator_run)
            generator_runs.append(generator_run)

            # Extend the `pending_observation` with newly generated point(s)
            # to avoid repeating them.
            pending_observations = extend_pending_observations(
                experiment=experiment,
                pending_observations=pending_observations,
                generator_runs=[generator_run],
            )
        return generator_runs

    def _should_continue_gen_for_trial(self) -> bool:
        """Determine if we should continue generating for the current trial, or end
        generation for the current trial. Note that generating more would involve
        transitioning to a next node, because each node generates once per call to
        ``GenerationStrategy.gen_with_multiple_nodes``.

        Returns:
            A boolean which represents if generation for a trial is complete
        """
        should_transition, next_node = self._curr.should_transition_to_next_node(
            raise_data_required_error=False
        )
        # if we should not transition nodes, we should stop generation for this trial.
        if not should_transition:
            return False

        # if we will transition nodes, check if the transition criterion which define
        # the transition from this node to the next node indicate that we should
        # continue generating in the same trial, otherwise end the generation.
        assert next_node is not None
        return all(
            tc.continue_trial_generation
            for tc in self._curr.transition_edges[next_node]
        )

    def _determine_fixed_features_from_node(
        self,
        node_to_gen_from: GenerationNode,
        gen_kwargs: dict[str, Any],
        passed_fixed_features: ObservationFeatures | None = None,
    ) -> ObservationFeatures | None:
        """Uses the ``InputConstructors`` on the node to determine the fixed features
        to pass into the model. If fixed_features are provided, the will take
        precedence over the fixed_features from the node.

        Args:
            node_to_gen_from: The node from which to generate from
            gen_kwargs: The kwargs passed to the ``GenerationStrategy``'s
                gen call.
            passed_fixed_features: The fixed features passed to the ``gen`` method if
                any.

        Returns:
            An object of ObservationFeatures that represents the fixed features to
            pass into the model.
        """
        # passed_fixed_features represents the fixed features that were passed by the
        # user to the gen method as overrides.
        if passed_fixed_features is not None:
            return passed_fixed_features

        node_fixed_features = None
        if (
            InputConstructorPurpose.FIXED_FEATURES
            in node_to_gen_from.input_constructors
        ):
            node_fixed_features = node_to_gen_from.input_constructors[
                InputConstructorPurpose.FIXED_FEATURES
            ](
                previous_node=node_to_gen_from.previous_node,
                next_node=node_to_gen_from,
                gs_gen_call_kwargs=gen_kwargs,
                experiment=self.experiment,
            )
        return node_fixed_features

    def _determine_sq_features_from_node(
        self,
        node_to_gen_from: GenerationNode,
        gen_kwargs: dict[str, Any],
    ) -> ObservationFeatures | None:
        """todo"""
        # TODO: @mgarrard to merge the input constructor logic into a single method
        node_sq_features = None
        if (
            InputConstructorPurpose.STATUS_QUO_FEATURES
            in node_to_gen_from.input_constructors
        ):
            node_sq_features = node_to_gen_from.input_constructors[
                InputConstructorPurpose.STATUS_QUO_FEATURES
            ](
                previous_node=node_to_gen_from.previous_node,
                next_node=node_to_gen_from,
                gs_gen_call_kwargs=gen_kwargs,
                experiment=self.experiment,
            )
        return node_sq_features

    def _determine_arms_from_node(
        self,
        node_to_gen_from: GenerationNode,
        gen_kwargs: dict[str, Any],
        n: int | None = None,
        arms_per_node: dict[str, int] | None = None,
    ) -> int:
        """Calculates the number of arms to generate from the node that will be used
        during generation.

        Args:
            n: Integer representing how many arms should be in the generator run
                produced by this method. NOTE: Some underlying models may ignore
                the `n` and produce a model-determined number of arms. In that
                case this method will also output a generator run with number of
                arms that can differ from `n`.
            node_to_gen_from: The node from which to generate from
            gen_kwargs: The kwargs passed to the ``GenerationStrategy``'s
                gen call.
            arms_per_node: An optional map from node name to the number of arms to
                generate from that node. If not provided, will default to the number
                of arms specified in the node's ``InputConstructors`` or n if no
                ``InputConstructors`` are defined on the node.

        Returns:
            The number of arms to generate from the node that will be used during this
            generation via ``_gen_multiple``.
        """
        if arms_per_node is not None:
            # arms_per_node provides a way to manually override input
            # constructors. This should be used with caution, and only
            # if you really know what you're doing. :)
            arms_from_node = arms_per_node[node_to_gen_from.node_name]
        elif InputConstructorPurpose.N not in node_to_gen_from.input_constructors:
            # if the node does not have an input constructor for N, then we
            # assume a default of generating n arms from this node.
            arms_from_node = n if n is not None else self.DEFAULT_N
        else:
            arms_from_node = node_to_gen_from.input_constructors[
                InputConstructorPurpose.N
            ](
                previous_node=node_to_gen_from.previous_node,
                next_node=node_to_gen_from,
                gs_gen_call_kwargs=gen_kwargs,
                experiment=self.experiment,
            )

        return arms_from_node

    # ------------------------- Model selection logic helpers. -------------------------

    def _fit_current_model(
        self,
        data: Data | None,
        status_quo_features: ObservationFeatures | None = None,
    ) -> None:
        """Fits or update the model on the current generation node (does not move
        between generation nodes).

        Args:
            data: Optional ``Data`` to fit or update with; if not specified, generation
                strategy will obtain the data via ``experiment.lookup_data``.
            status_quo_features: An ``ObservationFeature`` of the status quo arm,
                needed by some models during fit to accomadate relative constraints.
                Includes the status quo parameterization and target trial index.
        """
        data = self.experiment.lookup_data() if data is None else data

        # Only pass status_quo_features if not None to avoid errors
        # with ``ExternalGenerationNode``.
        if status_quo_features is not None:
            self._curr.fit(
                experiment=self.experiment,
                data=data,
                status_quo_features=status_quo_features,
            )
        else:
            self._curr.fit(
                experiment=self.experiment,
                data=data,
            )
        self._model = self._curr._fitted_model

    def _maybe_transition_to_next_node(
        self,
        raise_data_required_error: bool = True,
    ) -> bool:
        """Moves this generation strategy to next node if the current node is completed,
        and it is not the last node in this generation strategy. This method is safe to
        use both when generating candidates or simply checking how many generator runs
        (to be made into trials) can currently be produced.

        NOTE: this method raises ``GenerationStrategyCompleted`` error if the current
        generation node is complete, but it is also the last in generation strategy.

        Args:
            raise_data_required_error: Whether to raise ``DataRequiredError`` in the
                maybe_step_completed method in GenerationNode class.

        Returns:
            Whether generation strategy moved to the next node.
        """
        move_to_next_node, next_node = self._curr.should_transition_to_next_node(
            raise_data_required_error=raise_data_required_error
        )
        if move_to_next_node:
            if self.optimization_complete:
                raise GenerationStrategyCompleted(
                    f"Generation strategy {self} generated all the trials as "
                    "specified in its nodes."
                )
            if next_node is None:
                # If the last node did not specify which node to transition to,
                # move to the next node in the list.
                current_node_index = self._nodes.index(self._curr)
                next_node = self._nodes[current_node_index + 1].node_name
            for node in self._nodes:
                if node.node_name == next_node:
                    self._curr = node
                    # Moving to the next node also entails unsetting this GS's model
                    # (since new node's model will be initialized for the first time;
                    # this is done in `self._fit_current_model).
                    self._model = None
        return move_to_next_node
Ax

latest

Source code for ax.modelbridge.generation_strategy

Ax

Navigation

Related Topics