Skip to content

declearn.main.utils.TrainingManager

Class wrapping the logic for local training and evaluation rounds.

Source code in declearn/main/utils/_training.py
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
class TrainingManager:
    """Class wrapping the logic for local training and evaluation rounds."""

    # one too-many attribute; pylint: disable=too-many-instance-attributes

    def __init__(
        self,
        model: Model,
        optim: Optimizer,
        aggrg: Aggregator,
        train_data: Dataset,
        valid_data: Optional[Dataset] = None,
        metrics: Union[MetricSet, List[MetricInputType], None] = None,
        logger: Union[logging.Logger, str, None] = None,
        verbose: bool = True,
    ) -> None:
        """Instantiate the client-side training and evaluation process.

        Parameters
        ----------
        model: Model
            Model instance that needs training and/or evaluating.
        optim: Optimizer
            Optimizer instance that orchestrates training steps.
        aggrg: Aggregator
            Aggregator instance that is used to derive global model
            updates from peer-wise local ones.
        train_data: Dataset
            Dataset instance wrapping the local training dataset.
        valid_data: Dataset or None, default=None
            Dataset instance wrapping the local validation dataset.
            If None, use `train_data` in the evaluation rounds.
        metrics: MetricSet or list[MetricInputType] or None, default=None
            MetricSet instance or list of Metric instances and/or specs
            to wrap into one, defining evaluation metrics to compute in
            addition to the model's loss.
            If None, only compute and report the model's loss.
        logger: logging.Logger or str or None, default=None,
            Logger to use, or name of a logger to set up with
            `declearn.utils.get_logger`.
            If None, use `type(self).__name__`.
        verbose: bool, default=True
            Whether to display progress bars when running training
            and validation rounds.
        """
        # arguments serve modularity; pylint: disable=too-many-arguments
        self.model = model
        self.optim = optim
        self.aggrg = aggrg
        self.train_data = train_data
        self.valid_data = valid_data
        self.metrics = self._prepare_metrics(metrics)
        if not isinstance(logger, logging.Logger):
            logger = get_logger(logger or f"{type(self).__name__}")
        self.logger = logger
        self.verbose = verbose

    def _prepare_metrics(
        self,
        metrics: Union[MetricSet, List[MetricInputType], None],
    ) -> MetricSet:
        """Parse the `metrics` instantiation inputs into a MetricSet."""
        # Type-check and/or transform the inputs into a MetricSet instance.
        metrics = MetricSet.from_specs(metrics)
        # If any model loss metric is part of the set, remove it.
        # Note: rebuild the list rather than pop while iterating, which
        # would skip elements and could leave duplicate "loss" entries.
        metrics.metrics = [
            metric for metric in metrics.metrics if metric.name != "loss"
        ]
        # Add the wrapped model's loss to the metrics.
        loss = self._setup_loss_metric()
        metrics.metrics.append(loss)
        # Return the prepared object for assignment as `metrics` attribute.
        return metrics

    def _setup_loss_metric(
        self,
    ) -> Metric:
        """Return an ad-hoc Metric object to compute the model's loss."""
        loss_fn = self.model.loss_function

        # Write a custom, unregistered Metric subclass.
        class LossMetric(MeanMetric, register=False):
            """Ad hoc Metric wrapping a model's loss function."""

            name = "loss"

            def metric_func(
                self, y_true: np.ndarray, y_pred: np.ndarray
            ) -> np.ndarray:
                return loss_fn(y_true, y_pred)

        # Instantiate and return the ad-hoc loss metric.
        return LossMetric()

    def training_round(
        self,
        message: messaging.TrainRequest,
    ) -> Union[messaging.TrainReply, messaging.Error]:
        """Run a local training round.

        If an exception is raised during the local process, wrap it as
        an Error message instead of raising it.

        Parameters
        ----------
        message: TrainRequest
            Instructions from the server regarding the training round.

        Returns
        -------
        reply: TrainReply or Error
            Message wrapping results from the training round, or any
            error raised during it.
        """
        self.logger.info("Participating in training round %s", message.round_i)
        # Try running the training round; return the reply if successful.
        try:
            return self._training_round(message)
        # In case of failure, wrap the exception as an Error message.
        except Exception as exception:  # pylint: disable=broad-except
            self.logger.error(
                "Error encountered during training: %s.", exception
            )
            return messaging.Error(repr(exception))

    def _training_round(
        self,
        message: messaging.TrainRequest,
    ) -> messaging.TrainReply:
        """Backend to `training_round`, without exception capture hooks."""
        # Unpack and apply model weights and optimizer auxiliary variables.
        self.logger.info("Applying server updates to local objects.")
        if message.weights is None:
            start_weights = self.model.get_weights(trainable=True)
        else:
            start_weights = message.weights
            self.model.set_weights(start_weights, trainable=True)
        self.optim.process_aux_var(message.aux_var)
        self.optim.start_round()  # trigger loss regularizer's `on_round_start`
        # Train under instructed effort constraints.
        params = message.n_epoch, message.n_steps, message.timeout
        self.logger.info(
            "Training local model for %s epochs | %s steps | %s seconds.",
            *params,
        )
        effort = self.train_under_constraints(message.batches, *params)
        # Compute and preprocess model updates and collect auxiliary variables.
        self.logger.info("Packing local updates to be sent to the server.")
        updates = self.aggrg.prepare_for_sharing(
            updates=start_weights - self.model.get_weights(trainable=True),
            n_steps=int(effort["n_steps"]),
        )
        aux_var = self.optim.collect_aux_var()
        # Wrap them as a TrainReply together with effort metadata and return.
        return messaging.TrainReply(
            updates=updates,
            aux_var=aux_var,
            n_epoch=int(effort["n_epoch"]),
            n_steps=int(effort["n_steps"]),
            t_spent=round(effort["t_spent"], 3),
        )

    def train_under_constraints(
        self,
        batch_cfg: Dict[str, Any],
        n_epoch: Optional[int] = 1,
        n_steps: Optional[int] = None,
        timeout: Optional[int] = None,
    ) -> Dict[str, float]:
        """Run local SGD steps under effort constraints.

        This is the core backend to the `training_round` method,
        which further handles message parsing and passing, as well
        as exception catching.

        Parameters
        ----------
        batch_cfg: Dict[str, Any]
            Keyword arguments for `self.train_data.generate_batches`
            i.e. specifications of batches used in local SGD steps.
        n_epoch: int or None, default=1
            Maximum number of local training epochs to perform.
            May be overridden by `n_steps` or `timeout`.
        n_steps: int or None, default=None
            Maximum number of local training steps to perform.
            May be overridden by `n_epoch` or `timeout`.
        timeout: int or None, default=None
            Time (in seconds) beyond which to interrupt training,
            regardless of the actual number of steps taken (> 0).

        Returns
        -------
        effort: dict[str, float]
            Dictionary storing information on the computational
            effort effectively performed:
            * n_epoch: int
                Number of training epochs completed.
            * n_steps: int
                Number of training steps completed.
            * t_spent: float
                Time spent running training steps (in seconds).
        """
        # Set up effort constraints under which to operate.
        epochs = Constraint(limit=n_epoch, name="n_epoch")
        constraints = ConstraintSet(
            Constraint(limit=n_steps, name="n_steps"),
            TimeoutConstraint(limit=timeout, name="t_spent"),
        )
        # Run batch train steps for as long as constraints allow it.
        stop_training = False
        if self.verbose:
            progress_bar = tqdm.tqdm(desc="Training round", unit=" steps")
        while not (stop_training or epochs.saturated):
            for batch in self.train_data.generate_batches(**batch_cfg):
                # A StopIteration from the step signals a cancellation
                # request (see `_run_train_step`): end the round cleanly.
                try:
                    self._run_train_step(batch)
                except StopIteration as exc:
                    self.logger.warning("Interrupting training round: %s", exc)
                    stop_training = True
                    break
                if self.verbose:
                    progress_bar.update()
                constraints.increment()
                if constraints.saturated:
                    stop_training = True
                    break
            epochs.increment()
        # Close the progress bar to restore clean terminal output.
        if self.verbose:
            progress_bar.close()
        # Return a dict storing information on the training effort.
        effort = {"n_epoch": epochs.value}
        effort.update(constraints.get_values())
        return effort

    def _run_train_step(
        self,
        batch: Batch,
    ) -> None:
        """Run a single training step based on an input batch.

        Parameters
        ----------
        batch: Batch
            Batched data based on which to compute and apply model updates.

        Raises
        ------
        StopIteration
            If this step is being cancelled and the training routine
            in the context of which it is being called should stop.
        """
        self.optim.run_train_step(self.model, batch)

    def evaluation_round(
        self,
        message: messaging.EvaluationRequest,
    ) -> Union[messaging.EvaluationReply, messaging.Error]:
        """Run a local evaluation round.

        If an exception is raised during the local process, wrap it as
        an Error message instead of raising it.

        Parameters
        ----------
        message: EvaluationRequest
            Instructions from the server regarding the evaluation round.

        Returns
        -------
        reply: EvaluationReply or Error
            Message wrapping results from the evaluation round, or any
            error raised during it.
        """
        self.logger.info(
            "Participating in evaluation round %s", message.round_i
        )
        # Try running the evaluation round.
        try:
            return self._evaluation_round(message)
        # In case of failure, wrap the exception as an Error message.
        except Exception as exception:  # pylint: disable=broad-except
            self.logger.error(
                "Error encountered during evaluation: %s.", exception
            )
            return messaging.Error(repr(exception))

    def _evaluation_round(
        self,
        message: messaging.EvaluationRequest,
    ) -> messaging.EvaluationReply:
        """Backend to `evaluation_round`, without exception capture hooks."""
        # Update the model's weights and evaluate on the local dataset.
        if message.weights is not None:
            self.model.set_weights(message.weights, trainable=True)
        metrics, states, effort = self.evaluate_under_constraints(
            message.batches, message.n_steps, message.timeout
        )
        # Pack the resulting information into a message.
        self.logger.info("Packing local results to be sent to the server.")
        return messaging.EvaluationReply(
            loss=float(metrics["loss"]),
            metrics=states,
            n_steps=int(effort["n_steps"]),
            t_spent=round(effort["t_spent"], 3),
        )

    def evaluate_under_constraints(
        self,
        batch_cfg: Dict[str, Any],
        n_steps: Optional[int] = None,
        timeout: Optional[int] = None,
    ) -> Tuple[
        Dict[str, Union[float, np.ndarray]],
        Dict[str, MetricState],
        Dict[str, float],
    ]:
        """Run local loss computation under effort constraints.

        This is the core backend to the `evaluation_round` method,
        which further handles message parsing and passing, as well
        as exception catching.

        Parameters
        ----------
        batch_cfg: Dict[str, Any]
            Keyword arguments to `self.valid_data.generate_batches`.
        n_steps: int or None, default=None
            Maximum number of local evaluation steps to perform.
            May be overridden by `timeout` or dataset size.
        timeout: int or None, default=None
            Time (in seconds) beyond which to interrupt evaluation,
            regardless of the actual number of steps taken (> 0).

        Returns
        -------
        metrics:
            Computed metrics, as a dict with float or array values.
        states:
            Computed metrics, as partial values that may be shared
            with other agents to federatively compute final values
            with the same specs as `metrics`.
        effort:
            Dictionary storing information on the computational
            effort effectively performed:
            * n_steps: int
                Number of evaluation steps completed.
            * t_spent: float
                Time spent running evaluation steps (in seconds).
        """
        # Set up effort constraints under which to operate.
        constraints = ConstraintSet(
            Constraint(limit=n_steps, name="n_steps"),
            TimeoutConstraint(limit=timeout, name="t_spent"),
        )
        # Ensure evaluation metrics start from their base state.
        self.metrics.reset()
        # Run batch evaluation steps for as long as constraints allow it.
        dataset = self.valid_data or self.train_data
        if self.verbose:
            progress_bar = tqdm.tqdm(desc="Evaluation round", unit=" batches")
        for batch in dataset.generate_batches(**batch_cfg):
            inputs = self.model.compute_batch_predictions(batch)
            self.metrics.update(*inputs)
            if self.verbose:
                progress_bar.update()
            constraints.increment()
            if constraints.saturated:
                break
        # Close the progress bar to restore clean terminal output.
        if self.verbose:
            progress_bar.close()
        # Gather the computed metrics and computational effort information.
        effort = constraints.get_values()
        values = self.metrics.get_result()
        states = self.metrics.get_states()
        self.logger.log(
            LOGGING_LEVEL_MAJOR,
            "Local scalar evaluation metrics: %s",
            {k: v for k, v in values.items() if isinstance(v, float)},
        )
        # Return the metrics' values, their states and the effort information.
        return values, states, effort

__init__(model, optim, aggrg, train_data, valid_data=None, metrics=None, logger=None, verbose=True)

Instantiate the client-side training and evaluation process.

Parameters:

Name Type Description Default
model Model

Model instance that needs training and/or evaluating.

required
optim Optimizer

Optimizer instance that orchestrates training steps.

required
aggrg Aggregator

Aggregator instance that is used to derive global model updates from peer-wise local ones.

required
train_data Dataset

Dataset instance wrapping the local training dataset.

required
valid_data Optional[Dataset]

Dataset instance wrapping the local validation dataset. If None, use train_data in the evaluation rounds.

None
metrics Union[MetricSet, List[MetricInputType], None]

MetricSet instance or list of Metric instances and/or specs to wrap into one, defining evaluation metrics to compute in addition to the model's loss. If None, only compute and report the model's loss.

None
logger Union[logging.Logger, str, None]

Logger to use, or name of a logger to set up with declearn.utils.get_logger. If None, use type(self).__name__.

None
verbose bool

Whether to display progress bars when running training and validation rounds.

True
Source code in declearn/main/utils/_training.py
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
def __init__(
    self,
    model: Model,
    optim: Optimizer,
    aggrg: Aggregator,
    train_data: Dataset,
    valid_data: Optional[Dataset] = None,
    metrics: Union[MetricSet, List[MetricInputType], None] = None,
    logger: Union[logging.Logger, str, None] = None,
    verbose: bool = True,
) -> None:
    """Set up the client-side training and evaluation process.

    Parameters
    ----------
    model: Model
        Model instance that needs training and/or evaluating.
    optim: Optimizer
        Optimizer instance that orchestrates training steps.
    aggrg: Aggregator
        Aggregator instance that is used to derive global model
        updates from peer-wise local ones.
    train_data: Dataset
        Dataset instance wrapping the local training dataset.
    valid_data: Dataset or None, default=None
        Dataset instance wrapping the local validation dataset.
        When None, evaluation rounds fall back on `train_data`.
    metrics: MetricSet or list[MetricInputType] or None, default=None
        MetricSet instance, or list of Metric instances and/or specs
        to wrap into one, defining evaluation metrics to compute on
        top of the model's loss.
        When None, only the model's loss is computed and reported.
    logger: logging.Logger or str or None, default=None,
        Logger to use, or name of a logger to set up using
        `declearn.utils.get_logger`.
        When None, default to `type(self).__name__`.
    verbose: bool, default=True
        Whether progress bars should be displayed while running
        training and validation rounds.
    """
    # arguments serve modularity; pylint: disable=too-many-arguments
    # Record the computation-defining objects.
    self.model = model
    self.optim = optim
    self.aggrg = aggrg
    # Record the wrapped datasets and derive the evaluation metrics.
    self.train_data = train_data
    self.valid_data = valid_data
    self.metrics = self._prepare_metrics(metrics)
    # Set up (or merely assign) the logger, then record verbosity.
    if isinstance(logger, logging.Logger):
        self.logger = logger
    else:
        self.logger = get_logger(logger or f"{type(self).__name__}")
    self.verbose = verbose

evaluate_under_constraints(batch_cfg, n_steps=None, timeout=None)

Run local loss computation under effort constraints.

This is the core backend to the evaluation_round method, which further handles message parsing and passing, as well as exception catching.

Parameters:

Name Type Description Default
batch_cfg Dict[str, Any]

Keyword arguments to self.valid_data.generate_batches.

required
n_steps Optional[int]

Maximum number of local evaluation steps to perform. May be overridden by timeout or dataset size.

None
timeout Optional[int]

Time (in seconds) beyond which to interrupt evaluation, regardless of the actual number of steps taken (> 0).

None

Returns:

Name Type Description
metrics Dict[str, Union[float, np.ndarray]]

Computed metrics, as a dict with float or array values.

states Dict[str, MetricState]

Computed metrics, as partial values that may be shared with other agents to federatively compute final values with the same specs as metrics.

effort Dict[str, float]

Dictionary storing information on the computational effort effectively performed: `n_steps` (int) — number of evaluation steps completed; `t_spent` (float) — time spent running evaluation steps, in seconds.

Source code in declearn/main/utils/_training.py
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
def evaluate_under_constraints(
    self,
    batch_cfg: Dict[str, Any],
    n_steps: Optional[int] = None,
    timeout: Optional[int] = None,
) -> Tuple[
    Dict[str, Union[float, np.ndarray]],
    Dict[str, MetricState],
    Dict[str, float],
]:
    """Run local loss computation under effort constraints.

    This is the core backend to the `evaluation_round` method,
    which further handles message parsing and passing, as well
    as exception catching.

    Parameters
    ----------
    batch_cfg: Dict[str, Any]
        Keyword arguments to `self.valid_data.generate_batches`.
    n_steps: int or None, default=None
        Maximum number of local evaluation steps to perform.
        May be overridden by `timeout` or dataset size.
    timeout: int or None, default=None
        Time (in seconds) beyond which to interrupt evaluation,
        regardless of the actual number of steps taken (> 0).

    Returns
    -------
    metrics:
        Computed metrics, as a dict with float or array values.
    states:
        Computed metrics, as partial values that may be shared
        with other agents to federatively compute final values
        with the same specs as `metrics`.
    effort:
        Dictionary storing information on the computational
        effort effectively performed:
        * n_steps: int
            Number of evaluation steps completed.
        * t_spent: float
            Time spent running evaluation steps (in seconds).
    """
    # Set up effort constraints under which to operate.
    # Both constraints are incremented together: the evaluation loop
    # stops as soon as either the step budget or the timeout saturates.
    constraints = ConstraintSet(
        Constraint(limit=n_steps, name="n_steps"),
        TimeoutConstraint(limit=timeout, name="t_spent"),
    )
    # Ensure evaluation metrics start from their base state.
    self.metrics.reset()
    # Run batch evaluation steps for as long as constraints allow it.
    # Fall back on the training dataset when no validation one is set.
    dataset = self.valid_data or self.train_data
    if self.verbose:
        progress_bar = tqdm.tqdm(desc="Evaluation round", unit=" batches")
    for batch in dataset.generate_batches(**batch_cfg):
        inputs = self.model.compute_batch_predictions(batch)
        self.metrics.update(*inputs)
        if self.verbose:
            progress_bar.update()
        constraints.increment()
        if constraints.saturated:
            break
    # Gather the computed metrics and computational effort information.
    # NOTE(review): the tqdm progress bar is never closed — consider
    # calling `progress_bar.close()` here when `self.verbose` is set.
    effort = constraints.get_values()
    values = self.metrics.get_result()
    states = self.metrics.get_states()
    # Log scalar metrics only, at a "major" (always-displayed) level.
    self.logger.log(
        LOGGING_LEVEL_MAJOR,
        "Local scalar evaluation metrics: %s",
        {k: v for k, v in values.items() if isinstance(v, float)},
    )
    # Return the metrics' values, their states and the effort information.
    return values, states, effort

evaluation_round(message)

Run a local evaluation round.

If an exception is raised during the local process, wrap it as an Error message instead of raising it.

Parameters:

Name Type Description Default
message messaging.EvaluationRequest

Instructions from the server regarding the evaluation round.

required

Returns:

Name Type Description
reply EvaluationReply or Error

Message wrapping results from the evaluation round, or any error raised during it.

Source code in declearn/main/utils/_training.py
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
def evaluation_round(
    self,
    message: messaging.EvaluationRequest,
) -> Union[messaging.EvaluationReply, messaging.Error]:
    """Take part in a local evaluation round, capturing failures.

    Delegate the actual work to `_evaluation_round`; should any
    exception be raised while doing so, wrap it into an Error
    message rather than letting it propagate.

    Parameters
    ----------
    message: EvaluationRequest
        Instructions from the server regarding the evaluation round.

    Returns
    -------
    reply: EvaluationReply or Error
        Message wrapping results from the evaluation round, or any
        error raised during it.
    """
    self.logger.info(
        "Participating in evaluation round %s", message.round_i
    )
    # Run the round's backend, wrapping any failure as an Error reply.
    try:
        reply = self._evaluation_round(message)  # type: Union[messaging.EvaluationReply, messaging.Error]
    except Exception as exception:  # pylint: disable=broad-except
        self.logger.error(
            "Error encountered during evaluation: %s.", exception
        )
        reply = messaging.Error(repr(exception))
    return reply

train_under_constraints(batch_cfg, n_epoch=1, n_steps=None, timeout=None)

Run local SGD steps under effort constraints.

This is the core backend to the training_round method, which further handles message parsing and passing, as well as exception catching.

Parameters:

Name Type Description Default
batch_cfg Dict[str, Any]

Keyword arguments for self.train_data.generate_batches i.e. specifications of batches used in local SGD steps.

required
n_epoch Optional[int]

Maximum number of local training epochs to perform. May be overridden by n_steps or timeout.

1
n_steps Optional[int]

Maximum number of local training steps to perform. May be overridden by n_epoch or timeout.

None
timeout Optional[int]

Time (in seconds) beyond which to interrupt training, regardless of the actual number of steps taken (> 0).

None

Returns:

Name Type Description
effort dict[str, float]

Dictionary storing information on the computational effort effectively performed: `n_epoch` (int) — number of training epochs completed; `n_steps` (int) — number of training steps completed; `t_spent` (float) — time spent running training steps, in seconds.

Source code in declearn/main/utils/_training.py
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
def train_under_constraints(
    self,
    batch_cfg: Dict[str, Any],
    n_epoch: Optional[int] = 1,
    n_steps: Optional[int] = None,
    timeout: Optional[int] = None,
) -> Dict[str, float]:
    """Run local SGD steps under effort constraints.

    This is the core backend to the `training_round` method,
    which further handles message parsing and passing, as well
    as exception catching.

    Parameters
    ----------
    batch_cfg: Dict[str, Any]
        Keyword arguments for `self.train_data.generate_batches`
        i.e. specifications of batches used in local SGD steps.
    n_epoch: int or None, default=1
        Maximum number of local training epochs to perform.
        May be overridden by `n_steps` or `timeout`.
    n_steps: int or None, default=None
        Maximum number of local training steps to perform.
        May be overridden by `n_epoch` or `timeout`.
    timeout: int or None, default=None
        Time (in seconds) beyond which to interrupt training,
        regardless of the actual number of steps taken (> 0).

    Returns
    -------
    effort: dict[str, float]
        Dictionary storing information on the computational
        effort effectively performed:
        * n_epoch: int
            Number of training epochs completed.
        * n_steps: int
            Number of training steps completed.
        * t_spent: float
            Time spent running training steps (in seconds).
    """
    # Set up effort constraints under which to operate.
    # The epoch constraint is tracked apart from the step/time ones,
    # as it is only incremented once per full pass over the dataset.
    epochs = Constraint(limit=n_epoch, name="n_epoch")
    constraints = ConstraintSet(
        Constraint(limit=n_steps, name="n_steps"),
        TimeoutConstraint(limit=timeout, name="t_spent"),
    )
    # Run batch train steps for as long as constraints allow it.
    stop_training = False
    if self.verbose:
        progress_bar = tqdm.tqdm(desc="Training round", unit=" steps")
    while not (stop_training or epochs.saturated):
        for batch in self.train_data.generate_batches(**batch_cfg):
            # A StopIteration raised by the step signals a cancellation
            # request (see `_run_train_step`): end the round cleanly.
            try:
                self._run_train_step(batch)
            except StopIteration as exc:
                self.logger.warning("Interrupting training round: %s", exc)
                stop_training = True
                break
            if self.verbose:
                progress_bar.update()
            # Step and timeout constraints are checked after every step.
            constraints.increment()
            if constraints.saturated:
                stop_training = True
                break
        epochs.increment()
    # Return a dict storing information on the training effort.
    # NOTE(review): the tqdm progress bar is never closed — consider
    # calling `progress_bar.close()` here when `self.verbose` is set.
    effort = {"n_epoch": epochs.value}
    effort.update(constraints.get_values())
    return effort

training_round(message)

Run a local training round.

If an exception is raised during the local process, wrap it as an Error message instead of raising it.

Parameters:

Name Type Description Default
message messaging.TrainRequest

Instructions from the server regarding the training round.

required

Returns:

Name Type Description
reply TrainReply or Error

Message wrapping results from the training round, or any error raised during it.

Source code in declearn/main/utils/_training.py
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
def training_round(
    self,
    message: messaging.TrainRequest,
) -> Union[messaging.TrainReply, messaging.Error]:
    """Take part in a local training round, capturing failures.

    Delegate the actual work to `_training_round`; should any
    exception be raised while doing so, wrap it into an Error
    message rather than letting it propagate.

    Parameters
    ----------
    message: TrainRequest
        Instructions from the server regarding the training round.

    Returns
    -------
    reply: TrainReply or Error
        Message wrapping results from the training round, or any
        error raised during it.
    """
    self.logger.info("Participating in training round %s", message.round_i)
    # Run the round's backend, wrapping any failure as an Error reply.
    try:
        reply = self._training_round(message)  # type: Union[messaging.TrainReply, messaging.Error]
    except Exception as exception:  # pylint: disable=broad-except
        self.logger.error(
            "Error encountered during training: %s.", exception
        )
        reply = messaging.Error(repr(exception))
    return reply