Source code for unilab.training.seed

"""Shared training seed contract helpers."""

from __future__ import annotations

import random
from dataclasses import dataclass
from typing import Any

import numpy as np
from omegaconf import OmegaConf



[docs]
@dataclass(frozen=True)
class TrainingSeedInfo:
    """Configured and effective seed metadata for a training run."""

    configured_seed: int | None
    configured_seed_source: str | None
    effective_seed: int | None


[docs]
    def to_dict(self) -> dict[str, int | str | None]:
        return {
            "configured_seed": self.configured_seed,
            "configured_seed_source": self.configured_seed_source,
            "effective_seed": self.effective_seed,
        }




def _select_seed(cfg: Any, path: str) -> Any:
    if OmegaConf.is_config(cfg):
        return OmegaConf.select(cfg, path, default=None)

    current = cfg
    for part in path.split("."):
        if current is None:
            return None
        if isinstance(current, dict):
            current = current.get(part)
        else:
            current = getattr(current, part, None)
    return current



[docs]
def resolve_training_seed(cfg: Any) -> TrainingSeedInfo:
    """Resolve the configured seed, preferring the algorithm-level contract."""
    candidates = (
        ("algo.seed", _select_seed(cfg, "algo.seed")),
        ("training.seed", _select_seed(cfg, "training.seed")),
    )
    for source, raw_seed in candidates:
        if raw_seed is None:
            continue
        seed = int(raw_seed)
        if seed < 0:
            raise ValueError(f"{source} must be non-negative, got {seed}")
        return TrainingSeedInfo(
            configured_seed=seed,
            configured_seed_source=source,
            effective_seed=seed,
        )
    return TrainingSeedInfo(configured_seed=None, configured_seed_source=None, effective_seed=None)




[docs]
def derive_worker_seed(base_seed: int | None, worker_index: int = 0) -> int | None:
    """Derive deterministic subprocess seeds from the effective run seed."""
    if base_seed is None:
        return None
    if worker_index < 0:
        raise ValueError(f"worker_index must be non-negative, got {worker_index}")
    return int(base_seed) + int(worker_index) + 1




[docs]
def apply_training_seed(
    seed: int | None,
    *,
    torch_runtime: bool = True,
    cuda: bool = True,
    mlx_runtime: bool = False,
) -> int | None:
    """Apply a seed to the runtimes used by training entrypoints."""
    if seed is None:
        return None

    effective_seed = int(seed)
    if effective_seed < 0:
        raise ValueError(f"seed must be non-negative, got {effective_seed}")

    random.seed(effective_seed)
    np.random.seed(effective_seed)

    if torch_runtime:
        try:
            import torch
        except ImportError:
            torch = None
        if torch is not None:
            torch.manual_seed(effective_seed)
            if cuda and torch.cuda.is_available():
                torch.cuda.manual_seed_all(effective_seed)

    if mlx_runtime:
        try:
            import mlx.core as mx
        except ImportError:
            mx = None
        if mx is not None:
            mx.random.seed(effective_seed)

    return effective_seed




[docs]
def apply_configured_training_seed(
    cfg: Any,
    *,
    torch_runtime: bool = True,
    cuda: bool = True,
    mlx_runtime: bool = False,
) -> TrainingSeedInfo:
    """Resolve and apply the configured training seed before runtime construction."""
    seed_info = resolve_training_seed(cfg)
    effective_seed = apply_training_seed(
        seed_info.effective_seed,
        torch_runtime=torch_runtime,
        cuda=cuda,
        mlx_runtime=mlx_runtime,
    )
    return TrainingSeedInfo(
        configured_seed=seed_info.configured_seed,
        configured_seed_source=seed_info.configured_seed_source,
        effective_seed=effective_seed,
    )