Source code for optuna_integration.trackio.trackio

from __future__ import annotations

from collections.abc import Callable
from collections.abc import Sequence
import functools
from typing import Any
from typing import cast
from typing import TYPE_CHECKING

import optuna
from optuna._deprecated import deprecated_class
from optuna._imports import try_import


with try_import() as _imports:
    import trackio


if TYPE_CHECKING:
    from optuna.study.study import ObjectiveFuncType



[docs]
@deprecated_class("4.9.0", "6.0.0")
class TrackioCallback:
    """Callback to track Optuna trials with Trackio.

    This callback enables tracking of an Optuna study using Trackio.
    By default, the entire study is recorded as a single experiment run,
    where all suggested hyperparameters and optimized metrics are logged
    and visualized as a function of optimizer steps.

    Trackio is offline-first and does not require authentication for local
    usage. Optionally, results can be synchronized to Hugging Face Spaces
    or exported as Hugging Face Datasets for sharing, visualization, and
    reproducibility.

    .. note::
        Trackio does not require users to be logged in for local experiment
        tracking. Authentication is only required when synchronizing results
        to Hugging Face Hub (e.g., Spaces or Datasets).

    .. note::
        Unlike Weights & Biases, Trackio does not rely on global mutable state.
        Each run is explicitly initialized and finalized, which makes this
        callback safe to use in long-running processes and research pipelines.

    .. note::
        To ensure deterministic trial ordering in logged metrics, this
        callback should only be used with ``study.optimize(n_jobs=1)``.
        Parallel optimization may result in out-of-order steps.

    Example:

        Add Trackio callback to Optuna optimization.

        .. code-block:: python

            import optuna
            from optuna_integration.trackio import TrackioCallback


            def objective(trial):
                x = trial.suggest_float("x", -10, 10)
                return (x - 2) ** 2


            study = optuna.create_study()

            trackioc = TrackioCallback(project="my-optuna-study")

            study.optimize(objective, n_trials=10, callbacks=[trackioc])


        Trackio logging in multi-run (one run per trial) mode.

        .. code-block:: python

            import optuna
            from optuna_integration.trackio import TrackioCallback


            trackioc = TrackioCallback(
                project="my-optuna-study",
                as_multirun=True,
            )


            # Required when logging per-trial runs
            @trackioc.track_in_trackio()
            def objective(trial):
                x = trial.suggest_float("x", -10, 10)
                return (x - 2) ** 2


            study = optuna.create_study()
            study.optimize(objective, n_trials=10, callbacks=[trackioc])


        Publishing results to a Hugging Face Space.

        .. code-block:: python

            trackioc = TrackioCallback(
                project="my-optuna-study",
                space_id="username/optuna-dashboard",
                as_multirun=True,
            )


    Args:
        project:
            Name of the Trackio project. This determines the local storage
            directory and is also used when synchronizing results to a
            Hugging Face Space or Dataset.

        metric_name:
            Name assigned to the optimized metric. In case of multi-objective
            optimization, a sequence of names can be provided. These names
            are assigned to objective values in the order returned by the
            objective function.

            If a single name is provided (default: ``"value"``), it will be
            broadcast to multiple objectives using a numerical suffix,
            e.g., ``value_0``, ``value_1``.

            The number of metric names must match the number of objective
            values returned.

        as_multirun:
            If ``True``, creates a new Trackio run for each Optuna trial.
            This is useful for per-trial analysis, parameter importance
            visualizations, and sweep-style dashboards.

            If ``False`` (default), all trials are logged into a single run.

        space_id:
            Optional Hugging Face Space ID (``"username/space-name"``) to
            which the tracked project will be synchronized. If the Space
            does not exist, it will be created automatically.

        dataset_id:
            Optional Hugging Face Dataset ID (``"username/dataset-name"``)
            used to export trial metrics and parameters as a versioned
            dataset for offline analysis and reproducibility.

        private:
            Whether the Hugging Face Space or Dataset should be private.
            Defaults to the user or organization’s Hub settings.

        resume:
            Resume behavior when initializing Trackio runs. This is
            particularly relevant for Optuna studies that may be restarted
            or retried. Accepted values are ``"allow"``, ``"must"``, and
            ``"never"``. The default ``"allow"`` enables safe resumption of
            existing runs while avoiding run name collisions.

        trackio_kwargs:
            Additional keyword arguments passed to :func:`trackio.init`,
            such as ``resume`` or UI-related configuration options.
    """

    def __init__(
        self,
        project: str,
        metric_name: str | Sequence[str] = "value",
        *,
        as_multirun: bool = False,
        space_id: str | None = None,
        dataset_id: str | None = None,
        private: bool | None = None,
        resume: str = "allow",
        trackio_kwargs: dict[str, Any] | None = None,
    ) -> None:
        _imports.check()

        if not isinstance(metric_name, (str, Sequence)):
            raise TypeError(f"metric_name must be str or sequence[str], got {type(metric_name)}")

        self._project: str = project
        self._metric_name: str | Sequence[str] = metric_name
        self._as_multirun: bool = as_multirun
        self._space_id: str | None = space_id  # HF inits for trackio
        self._dataset_id: str | None = dataset_id
        self._private: bool | None = private
        self._resume: str = resume
        self._trackio_kwargs: dict[str, Any] = trackio_kwargs or {}

        # Explicit internal state (DO NOT infer from Trackio, will cause errors)
        self._objective_wrapped: bool = False
        self._base_run_name: str | None = None
        self._active_trial_number: int | None = None

    def __call__(
        self,
        _study: optuna.study.Study,
        trial: optuna.trial.FrozenTrial,
    ) -> None:
        if self._base_run_name is None:
            self._base_run_name = _study.study_name
        if trial.values is None:
            return

        # If the objective was not wrapped, we cannot safely log
        if not self._objective_wrapped:
            if self._as_multirun:
                print(
                    "TrackioCallback(as_multirun=True) requires the objective to be "
                    "wrapped with @trackioc.track_in_trackio(). "
                )
            return

        metrics = self._build_metrics(trial)

        # Safe wrapper guarantees a live Trackio run
        trackio.log(
            {
                **trial.params,
                **metrics,
                "trial_number": trial.number,
            },
            step=trial.number,
        )


[docs]
    def track_in_trackio(self) -> Callable:
        """Decorator for enabling Trackio logging inside the objective function.

        This decorator wraps an Optuna objective function so that a Trackio run
        is initialized before the objective executes and finalized afterward.
        Any calls to :func:`trackio.log` inside the objective will be associated
        with the correct run.

        The decorator is required when logging from inside the objective
        function, since Optuna callbacks are invoked *after* a trial finishes
        and therefore cannot manage per-trial runtime state.

        When ``as_multirun=True``, a separate Trackio run is created for each
        Optuna trial. When ``as_multirun=False``, all trials are logged into a
        single run.

        Example:

            Add additional logging inside the objective function.

            .. code-block:: python

                import optuna
                import trackio
                from optuna_integration.trackio import TrackioCallback

                trackioc = TrackioCallback(
                    project="my-optuna-study",
                    as_multirun=True,
                )


                @trackioc.track_in_trackio()
                def objective(trial: optuna.trial.Trial) -> float:
                    x = trial.suggest_float("x", -10, 10)

                    # Log custom metrics inside the objective
                    trackio.log({"x": x, "loss_squared": (x - 2) ** 2})

                    return (x - 2) ** 2


                study = optuna.create_study()
                study.optimize(objective, n_trials=10, callbacks=[trackioc])

        Returns:
            A wrapped objective function with Trackio logging enabled.
        """

        def decorator(func: ObjectiveFuncType) -> ObjectiveFuncType:
            self._objective_wrapped = True  # explicit contract
            wrapped = self._wrap_objective(func)

            @functools.wraps(func)
            def wrapper(trial: optuna.trial.Trial) -> Any:
                return wrapped(trial)

            return wrapper

        return decorator


    def _wrap_objective(self, func: ObjectiveFuncType) -> ObjectiveFuncType:
        @functools.wraps(func)
        def wrapped(trial: optuna.trial.Trial) -> Any:
            base_name = self._base_run_name or "optuna-study"

            if self._as_multirun:
                run_name = f"trial/{trial.number}/{base_name}"
                self._active_trial_number = trial.number
            else:
                run_name = base_name

            trackio.init(
                project=self._project,
                name=run_name,
                space_id=self._space_id,
                dataset_id=self._dataset_id,
                private=self._private,
                resume=self._resume,
                **self._trackio_kwargs,
            )

            try:
                return func(trial)

            except optuna.exceptions.TrialPruned:
                trackio.log({"trial_state": "pruned"})
                raise

            except Exception as exc:
                trackio.log({"trial_state": "failed", "error": str(exc)})
                raise

            finally:
                if self._as_multirun:
                    cast(Any, trackio).finish()
                    self._active_trial_number = None

        return wrapped

    def _build_metrics(self, trial: optuna.trial.FrozenTrial) -> dict[str, float]:
        values = trial.values
        assert values is not None

        if isinstance(self._metric_name, str):
            if len(values) == 1:
                names = [self._metric_name]
            else:
                names = [f"{self._metric_name}_{i}" for i in range(len(values))]
        else:
            if len(self._metric_name) != len(values):
                raise ValueError(
                    "Metric names must match number of objectives "
                    f"({len(self._metric_name)} vs {len(values)})"
                )
            names = list(self._metric_name)

        return dict(zip(names, values))