Skip to content

openg2g.controller

openg2g.controller.base

Abstract base class for controllers.

Controller

Bases: Generic[DCBackendT, GridBackendT], ABC

Interface for a control component in the G2G framework.

Controllers receive datacenter and grid state and produce control actions. Multiple controllers compose in order within the coordinator.

Source code in openg2g/controller/base.py
class Controller(Generic[DCBackendT, GridBackendT], ABC):
    """Interface for a control component in the G2G framework.

    Controllers receive datacenter and grid state and produce control actions.
    Multiple controllers compose in order within the coordinator.
    """

    # Compatibility declaration: which backend classes this controller can
    # drive. Filled in by __init_subclass__ from the subclass's generic
    # specialization; the base defaults accept any backend.
    _dc_types: tuple[type[DatacenterBackend], ...] = (DatacenterBackend,)
    _grid_types: tuple[type[GridBackend], ...] = (GridBackend,)

    def __init_subclass__(cls, **kwargs: object) -> None:
        super().__init_subclass__(**kwargs)
        dc_types: tuple[type[DatacenterBackend], ...] | None = None
        grid_types: tuple[type[GridBackend], ...] | None = None
        # __orig_bases__ preserves the parameterized form (Controller[X, Y])
        # that plain __bases__ erases to bare Controller.
        for base in getattr(cls, "__orig_bases__", ()):
            if get_origin(base) is Controller:
                args = get_args(base)
                if len(args) != 2:
                    raise TypeError(
                        f"{cls.__name__} must specialize Controller with two generic args: "
                        "Controller[DatacenterType, GridType]."
                    )
                dc_raw, grid_raw = args
                # _normalize_backend_type_arg is defined elsewhere in this
                # module; presumably it expands each generic arg into a tuple
                # of concrete classes — confirm against its definition.
                dc_norm = _normalize_backend_type_arg(dc_raw, required_base=DatacenterBackend)
                grid_norm = _normalize_backend_type_arg(grid_raw, required_base=GridBackend)
                # Keep only genuine backend subclasses from the normalized args.
                dc_types = tuple(t for t in dc_norm if issubclass(t, DatacenterBackend))
                grid_types = tuple(t for t in grid_norm if issubclass(t, GridBackend))
                break

        if dc_types is None or grid_types is None:
            # No direct Controller[...] specialization on this class: inherit
            # the compatibility tuples from an already-specialized parent
            # controller, if there is one.
            inherited = [b for b in cls.__bases__ if issubclass(b, Controller)]
            inherited = [b for b in inherited if b is not Controller]
            if inherited:
                parent = inherited[0]
                cls._dc_types = parent.compatible_datacenter_types()
                cls._grid_types = parent.compatible_grid_types()
                return
            raise TypeError(
                f"{cls.__name__} must explicitly specialize Controller generics as "
                "Controller[DatacenterType, GridType]."
            )

        cls._dc_types = dc_types
        cls._grid_types = grid_types

    @final
    @classmethod
    def compatible_datacenter_types(cls) -> tuple[type[DatacenterBackend], ...]:
        """Datacenter backend classes this controller class accepts."""
        return cls._dc_types

    @final
    @classmethod
    def compatible_grid_types(cls) -> tuple[type[GridBackend], ...]:
        """Grid backend classes this controller class accepts."""
        return cls._grid_types

    @final
    @classmethod
    def compatibility_signature(cls) -> str:
        """Human-readable summary, e.g. ``Controller[FooDC, BarGrid]``."""
        dc = " | ".join(t.__name__ for t in cls.compatible_datacenter_types())
        grid = " | ".join(t.__name__ for t in cls.compatible_grid_types())
        return f"Controller[{dc}, {grid}]"

    @property
    @abstractmethod
    def dt_s(self) -> Fraction:
        """Control interval as a Fraction (seconds)."""

    @abstractmethod
    def reset(self) -> None:
        """Reset simulation state to initial conditions.

        Called by the coordinator before each [`start`][..start]. Must
        clear all simulation state: dual variables, counters, cached
        matrices. Configuration (dt_s, fits, step sizes) is not
        affected.

        Abstract so every implementation explicitly enumerates its state.
        A forgotten field is a bug -- not clearing it silently corrupts
        the second run.
        """

    def start(self) -> None:
        """Acquire per-run resources.

        Called after [`reset`][..reset], before the simulation loop.
        No-op by default because most controllers have no resources to
        acquire.
        """

    def stop(self) -> None:
        """Release per-run resources. Simulation state is preserved.

        Called after the simulation loop in LIFO order. No-op by default.
        """

    @abstractmethod
    def step(
        self,
        clock: SimulationClock,
        datacenter: DCBackendT,
        grid: GridBackendT,
        events: EventEmitter,
    ) -> list[DatacenterCommand | GridCommand]:
        """Compute control commands for this step. Return an empty list for no-op."""

dt_s abstractmethod property

Control interval as a Fraction (seconds).

reset() abstractmethod

Reset simulation state to initial conditions.

Called by the coordinator before each start. Must clear all simulation state: dual variables, counters, cached matrices. Configuration (dt_s, fits, step sizes) is not affected.

Abstract so every implementation explicitly enumerates its state. A forgotten field is a bug -- not clearing it silently corrupts the second run.

Source code in openg2g/controller/base.py
@abstractmethod
def reset(self) -> None:
    """Reset simulation state to initial conditions.

    Called by the coordinator before each [`start`][..start]. Must
    clear all simulation state: dual variables, counters, cached
    matrices. Configuration (dt_s, fits, step sizes) is not
    affected.

    Abstract so every implementation explicitly enumerates its state.
    A forgotten field is a bug -- not clearing it silently corrupts
    the second run.

    Returns nothing; implementations mutate the controller in place.
    """

start()

Acquire per-run resources.

Called after reset, before the simulation loop. No-op by default because most controllers have no resources to acquire.

Source code in openg2g/controller/base.py
def start(self) -> None:
    """Acquire per-run resources.

    Called after [`reset`][..reset], before the simulation loop.
    No-op by default because most controllers have no resources to
    acquire. Override only when the controller must acquire something
    per run; the base implementation does nothing.
    """

stop()

Release per-run resources. Simulation state is preserved.

Called after the simulation loop in LIFO order. No-op by default.

Source code in openg2g/controller/base.py
def stop(self) -> None:
    """Release per-run resources. Simulation state is preserved.

    Called after the simulation loop in LIFO order. No-op by default;
    the base implementation does nothing.
    """

step(clock, datacenter, grid, events) abstractmethod

Compute control commands for this step. Return an empty list for no-op.

Source code in openg2g/controller/base.py
@abstractmethod
def step(
    self,
    clock: SimulationClock,
    datacenter: DCBackendT,
    grid: GridBackendT,
    events: EventEmitter,
) -> list[DatacenterCommand | GridCommand]:
    """Compute control commands for this step. Return an empty list for no-op.

    Args:
        clock: Simulation clock for the current step.
        datacenter: Datacenter backend whose state the controller reads.
        grid: Grid backend whose state the controller reads.
        events: Emitter for controller telemetry events.

    Returns:
        Commands to apply this step; an empty list means no action.
    """

openg2g.controller.batch_size_schedule

Batch size schedule controller: applies pre-defined batch size changes at specified times.

BatchSizeChange dataclass

A batch size change event, optionally with gradual ramp-up.

Attributes:

Name Type Description
batch_size int

Target batch size (max_num_seqs).

ramp_up_rate float

Requests/second ramp-up rate. 0 means immediate.

Source code in openg2g/controller/batch_size_schedule.py
@dataclass(frozen=True)
class BatchSizeChange:
    """An immutable batch size change event, with optional gradual ramp-up.

    Attributes:
        batch_size: Target batch size (max_num_seqs).
        ramp_up_rate: Requests/second ramp-up rate. 0 means immediate.
    """

    batch_size: int
    ramp_up_rate: float = 0.0

    def __post_init__(self) -> None:
        # Validate at construction so an invalid change can never be scheduled.
        if not self.batch_size > 0:
            raise ValueError(f"batch_size must be positive, got {self.batch_size}.")
        if not self.ramp_up_rate >= 0:
            raise ValueError(f"ramp_up_rate must be >= 0, got {self.ramp_up_rate}.")

    def at(self, t: float) -> BatchSizeSchedule:
        """Schedule this change at time *t* seconds.

        Args:
            t: Simulation time (seconds) at which the change fires.

        Returns:
            A single-entry [`BatchSizeSchedule`][...BatchSizeSchedule].
        """
        entry = (t, self)
        return BatchSizeSchedule((entry,))

at(t)

Schedule this change at time t seconds.

Returns:

Type Description
BatchSizeSchedule

A single-entry BatchSizeSchedule.

Source code in openg2g/controller/batch_size_schedule.py
def at(self, t: float) -> BatchSizeSchedule:
    """Schedule this change at time *t* seconds.

    Args:
        t: Simulation time (seconds) at which the change fires.

    Returns:
        A single-entry [`BatchSizeSchedule`][...BatchSizeSchedule].
    """
    return BatchSizeSchedule(((t, self),))

BatchSizeSchedule

Ordered sequence of batch size changes, built with | operator.

Example:

schedule = (
    BatchSizeChange(48).at(40)
    | BatchSizeChange(32).at(60)
    | BatchSizeChange(48, ramp_up_rate=4).at(280)
)

Raises:

Type Description
ValueError

If two entries share the same timestamp.

Source code in openg2g/controller/batch_size_schedule.py
class BatchSizeSchedule:
    """Time-ordered sequence of batch size changes, composed with `|`.

    Example:

    ```python
    schedule = (
        BatchSizeChange(48).at(40)
        | BatchSizeChange(32).at(60)
        | BatchSizeChange(48, ramp_up_rate=4).at(280)
    )
    ```

    Raises:
        ValueError: If two entries share the same timestamp.
    """

    __slots__ = ("_entries",)

    def __init__(self, entries: tuple[tuple[float, BatchSizeChange], ...]) -> None:
        # Store entries sorted by timestamp; reject duplicate timestamps
        # because the schedule would otherwise be ambiguous.
        self._entries = tuple(sorted(entries, key=lambda item: item[0]))
        seen: set[float] = set()
        dupes: set[float] = set()
        for ts, _ in self._entries:
            if ts in seen:
                dupes.add(ts)
            seen.add(ts)
        if dupes:
            raise ValueError(f"BatchSizeSchedule has duplicate timestamps: {sorted(dupes)}")

    def __or__(self, other: BatchSizeSchedule) -> BatchSizeSchedule:
        combined = self._entries + other._entries
        return BatchSizeSchedule(combined)

    def __iter__(self) -> Iterator[tuple[float, BatchSizeChange]]:
        yield from self._entries

    def __len__(self) -> int:
        return len(self._entries)

    def __bool__(self) -> bool:
        return len(self._entries) > 0

    def __repr__(self) -> str:
        def _render(entry: tuple[float, BatchSizeChange]) -> str:
            ts, change = entry
            if change.ramp_up_rate > 0:
                ramp = f", ramp_up_rate={change.ramp_up_rate}"
            else:
                ramp = ""
            return f"BatchSizeChange({change.batch_size}{ramp}).at(t={ts})"

        return " | ".join(_render(e) for e in self._entries)

BatchSizeScheduleController

Bases: Controller[DatacenterBackend, GridBackend]

Applies pre-defined batch size changes at scheduled times.

Walks each model's schedule and emits SetBatchSize commands when the simulation clock reaches the scheduled time.

Parameters:

Name Type Description Default
schedules dict[str, BatchSizeSchedule]

Per-model batch size schedules, keyed by model label.

required
dt_s Fraction

How often the controller checks the schedule (seconds).

Fraction(1)
Source code in openg2g/controller/batch_size_schedule.py
class BatchSizeScheduleController(Controller[DatacenterBackend, GridBackend]):
    """Replays pre-defined batch size changes at their scheduled times.

    Walks each model's schedule and emits
    [`SetBatchSize`][openg2g.datacenter.command.SetBatchSize] commands when the
    simulation clock reaches the scheduled time.

    Args:
        schedules: Per-model batch size schedules, keyed by model label.
        dt_s: How often the controller checks the schedule (seconds).
    """

    def __init__(
        self,
        *,
        schedules: dict[str, BatchSizeSchedule],
        dt_s: Fraction = Fraction(1),
    ) -> None:
        self._dt_s = dt_s
        # Defensive copy: callers may mutate their dict after construction.
        self._schedules = dict(schedules)
        # Per-model cursor into the (sorted) schedule entries.
        self._indices: dict[str, int] = dict.fromkeys(schedules, 0)

    def reset(self) -> None:
        """Rewind every schedule cursor to the beginning."""
        self._indices = dict.fromkeys(self._schedules, 0)

    @property
    def dt_s(self) -> Fraction:
        """Control interval in seconds."""
        return self._dt_s

    def step(
        self,
        clock: SimulationClock,
        datacenter: DatacenterBackend,
        grid: GridBackend,
        events: EventEmitter,
    ) -> list[DatacenterCommand | GridCommand]:
        """Emit one SetBatchSize command covering all schedule entries now due."""
        now = clock.time_s
        fired: dict[str, int] = {}
        ramps: dict[str, float] = {}

        for label, schedule in self._schedules.items():
            entries = list(schedule)
            cursor = self._indices[label]
            # Consume every entry whose timestamp has passed; the small
            # epsilon absorbs float rounding at exact boundaries. If several
            # entries are due at once, the latest one wins.
            while cursor < len(entries) and float(entries[cursor][0]) <= now + 1e-12:
                _, change = entries[cursor]
                fired[label] = change.batch_size
                if change.ramp_up_rate > 0:
                    ramps[label] = change.ramp_up_rate
                cursor += 1
            self._indices[label] = cursor

        if not fired:
            return []
        events.emit(
            "controller.batch_schedule.fired",
            {"batch_size_by_model": fired},
        )
        return [
            SetBatchSize(
                batch_size_by_model=fired,
                ramp_up_rate_by_model=ramps,
            )
        ]

openg2g.controller.load_shift

Cross-site LLM load shifting controller.

Shifts replicas between datacenters when batch-size control (OFO) is exhausted and voltage violations persist. Runs after all per-site OFO controllers in the coordinator loop.

LoadShiftConfig

Bases: BaseModel

Configuration for cross-site load shifting.

Source code in openg2g/controller/load_shift.py
class LoadShiftConfig(BaseModel):
    """Configuration for cross-site load shifting."""

    # Master switch; when False the controller emits no commands.
    enabled: bool = False
    # GPUs' worth of replicas to move per corrective shift.
    gpus_per_shift: int = 8
    headroom: float = 0.3
    """Fraction of extra server capacity to pre-allocate at each DC
    so incoming replicas have room (e.g. 0.3 = 30% headroom)."""

headroom = 0.3 class-attribute instance-attribute

Fraction of extra server capacity to pre-allocate at each DC so incoming replicas have room (e.g. 0.3 = 30% headroom).

LoadShiftController

Bases: Controller[LLMBatchSizeControlledDatacenter, OpenDSSGrid]

Shift LLM replicas between datacenters to resolve voltage violations.

Rules:

1. Only shift models already running at both source and destination.
2. Only act when batch sizes are saturated AND the violation persists.
3. For undervoltage: shift load OUT of the violated site → the highest-voltage site. For overvoltage: shift load INTO the violated site ← the lowest-voltage site.
4. Shift gpus_per_shift GPUs worth of replicas per time step.
5. Repeat until the violation resolves or no candidates remain.

Source code in openg2g/controller/load_shift.py
class LoadShiftController(Controller[LLMBatchSizeControlledDatacenter, OpenDSSGrid]):
    """Shift LLM replicas between datacenters to resolve voltage violations.

    Rules:
    1. Only shift models already running at both source and destination.
    2. Only act when batch sizes are saturated AND violation persists.
    3. For undervoltage: shift load OUT of violated site → highest-voltage site.
       For overvoltage: shift load INTO violated site ← lowest-voltage site.
    4. Shift ``gpus_per_shift`` GPUs worth of replicas per time step.
    5. Repeat until violation resolves or no candidates remain.
    """

    def __init__(
        self,
        *,
        config: LoadShiftConfig,
        dt_s: Fraction,
        datacenters: dict[str, LLMBatchSizeControlledDatacenter],
        site_bus_map: dict[str, str],
        models_by_site: dict[str, list[str]],
        gpus_per_replica_by_model: dict[str, int],
        feasible_batch_sizes_by_model: dict[str, list[int]],
        v_min: float = 0.95,
        v_max: float = 1.05,
    ) -> None:
        self._config = config
        self._dt_s = dt_s
        self._datacenters = datacenters  # site_id -> datacenter
        self._site_bus_map = site_bus_map  # site_id -> bus name
        self._models_by_site = models_by_site  # site_id -> [model_labels]
        self._gpus_per_replica = gpus_per_replica_by_model
        self._feasible_bs = feasible_batch_sizes_by_model
        self._v_min = v_min  # lower voltage bound (pu)
        self._v_max = v_max  # upper voltage bound (pu)
        self._step_count = 0  # simulation state; cleared by reset()

    @property
    def dt_s(self) -> Fraction:
        """Control interval in seconds."""
        return self._dt_s

    @property
    def site_id(self) -> str | None:
        # None signals this controller operates across sites, not on one.
        return None  # cross-site controller

    def step(
        self,
        clock: SimulationClock,
        datacenter: LLMBatchSizeControlledDatacenter,
        grid: OpenDSSGrid,
        events: EventEmitter,
    ) -> list[DatacenterCommand | GridCommand]:
        """Emit paired ShiftReplicas commands for sites with voltage violations."""
        self._step_count += 1
        if not self._config.enabled:
            return []

        # Build bus -> min voltage mapping from grid
        voltages = grid.voltages_vector()
        v_index = grid.v_index  # list of (bus, phase)
        bus_voltages: dict[str, list[float]] = {}
        # NOTE(review): strict=False tolerates a length mismatch between
        # v_index and voltages — confirm that is intended and not masking one.
        for (bus, _phase), v in zip(v_index, voltages, strict=False):
            bus_voltages.setdefault(bus.lower(), []).append(float(v))

        # Per-site min/max voltage
        site_vmin: dict[str, float] = {}
        site_vmax: dict[str, float] = {}
        for site_id, bus in self._site_bus_map.items():
            vs = bus_voltages.get(bus.lower(), [])
            if vs:
                site_vmin[site_id] = min(vs)
                site_vmax[site_id] = max(vs)

        commands: list[DatacenterCommand | GridCommand] = []

        # Check each site for violations
        for site_id in list(self._site_bus_map.keys()):
            # Sites with no voltage reading default to 1.0 pu (no violation).
            vmin = site_vmin.get(site_id, 1.0)
            vmax = site_vmax.get(site_id, 1.0)

            is_undervoltage = vmin < self._v_min
            is_overvoltage = vmax > self._v_max

            if not is_undervoltage and not is_overvoltage:
                continue

            # Check if batch sizes are saturated at this site
            if not self._is_batch_saturated(site_id, datacenter, grid, is_undervoltage):
                continue

            # Find best destination and model to shift
            site_models = set(self._models_by_site.get(site_id, []))

            if is_undervoltage:
                # Shift load OUT: pick destination with highest voltage AND available capacity
                best_dest = None
                best_v = -1.0
                for other_id in self._site_bus_map:
                    if other_id == site_id:
                        continue
                    other_models = set(self._models_by_site.get(other_id, []))
                    shared = site_models & other_models
                    if not shared:
                        continue
                    # NOTE(review): capacity is checked against gpus_per_shift,
                    # but the actual move below is max(1, gpus_per_shift //
                    # gpus_per_replica) replicas, which can need more GPUs than
                    # gpus_per_shift when a replica is larger — confirm intended.
                    dest_dc = self._datacenters.get(other_id)
                    if dest_dc is not None and dest_dc.available_gpu_capacity() < self._config.gpus_per_shift:
                        continue  # no room at this destination
                    ov = site_vmin.get(other_id, 0.0)
                    if ov > best_v:
                        best_v = ov
                        best_dest = other_id

                if best_dest is None:
                    continue

                shared_models = site_models & set(self._models_by_site.get(best_dest, []))
                model = self._pick_model(shared_models)
                if model is None:
                    continue

                # At least one replica per shift, even for very large models.
                replicas = max(1, self._config.gpus_per_shift // self._gpus_per_replica[model])
                commands.append(
                    ShiftReplicas(
                        model_label=model,
                        replica_delta=-replicas,
                        target_site_id=site_id,
                    )
                )
                commands.append(
                    ShiftReplicas(
                        model_label=model,
                        replica_delta=+replicas,
                        target_site_id=best_dest,
                    )
                )
                logger.info(
                    "LoadShift: undervoltage at %s (Vmin=%.4f), shift %s ×%d replicas -> %s (Vmin=%.4f, free=%d GPUs)",
                    site_id,
                    vmin,
                    model,
                    replicas,
                    best_dest,
                    best_v,
                    self._datacenters[best_dest].available_gpu_capacity() if best_dest in self._datacenters else -1,
                )

            elif is_overvoltage:
                # Shift load IN: check this site has capacity, pick source with lowest voltage
                site_dc = self._datacenters.get(site_id)
                if site_dc is not None and site_dc.available_gpu_capacity() < self._config.gpus_per_shift:
                    continue  # violated site is full, can't accept more load

                best_src = None
                best_v = 2.0
                for other_id in self._site_bus_map:
                    if other_id == site_id:
                        continue
                    other_models = set(self._models_by_site.get(other_id, []))
                    shared = site_models & other_models
                    if not shared:
                        continue
                    # Default 2.0 equals the initial best_v, so sites without a
                    # voltage reading can never be selected as the source.
                    ov = site_vmax.get(other_id, 2.0)
                    if ov < best_v:
                        best_v = ov
                        best_src = other_id

                if best_src is None:
                    continue

                shared_models = site_models & set(self._models_by_site.get(best_src, []))
                model = self._pick_model(shared_models)
                if model is None:
                    continue

                replicas = max(1, self._config.gpus_per_shift // self._gpus_per_replica[model])
                commands.append(
                    ShiftReplicas(
                        model_label=model,
                        replica_delta=-replicas,
                        target_site_id=best_src,
                    )
                )
                commands.append(
                    ShiftReplicas(
                        model_label=model,
                        replica_delta=+replicas,
                        target_site_id=site_id,
                    )
                )
                logger.info(
                    "LoadShift: overvoltage at %s (Vmax=%.4f), shift %s ×%d replicas <- %s (Vmax=%.4f)",
                    site_id,
                    vmax,
                    model,
                    replicas,
                    best_src,
                    best_v,
                )

        return commands

    def _is_batch_saturated(
        self,
        site_id: str,
        datacenter: LLMBatchSizeControlledDatacenter,
        grid: OpenDSSGrid,
        is_undervoltage: bool,
    ) -> bool:
        """Check if all models at site have batch sizes at their limit.

        For undervoltage: saturated = all at minimum batch (can't reduce power further
        via OFO — batch is already at min so load can't be lowered).
        For overvoltage: saturated = all at maximum batch (can't increase power further).

        NOTE(review): the ``datacenter`` and ``grid`` parameters are unused here;
        the site's datacenter is looked up via self._datacenters instead.
        """
        dc = self._datacenters.get(site_id)
        if dc is None:
            return False
        state = dc.state
        if state is None:
            return False

        site_models = self._models_by_site.get(site_id, [])
        for model_label in site_models:
            current_bs = state.batch_size_by_model.get(model_label)
            feasible = self._feasible_bs.get(model_label, [])
            # Models with no feasible-batch data or no current reading are
            # skipped, i.e. they never block the "saturated" verdict.
            if not feasible or current_bs is None:
                continue
            if is_undervoltage:
                # Saturated = at minimum batch (OFO can't reduce power further)
                if current_bs > min(feasible):
                    return False  # Still room to reduce
            else:
                # Saturated = at maximum batch (OFO can't increase power further)
                if current_bs < max(feasible):
                    return False  # Still room to increase
        return True

    def _pick_model(self, shared_models: set[str]) -> str | None:
        """Pick the model with the most GPUs per replica (largest power impact)."""
        if not shared_models:
            return None
        return max(shared_models, key=lambda m: self._gpus_per_replica.get(m, 1))

    def reset(self) -> None:
        """Clear simulation state: only the step counter."""
        self._step_count = 0

    def start(self) -> None:
        # No per-run resources to acquire.
        pass

    def stop(self) -> None:
        # No per-run resources to release.
        pass

openg2g.controller.noop

No-op controller that does nothing.

NoopController

Bases: Controller[DatacenterBackend, GridBackend]

Controller that always returns an empty action.

Source code in openg2g/controller/noop.py
class NoopController(Controller[DatacenterBackend, GridBackend]):
    """Controller that always returns an empty action."""

    def __init__(self, dt_s: Fraction = Fraction(1)) -> None:
        # Only configuration, no simulation state.
        self._dt_s = dt_s

    @property
    def dt_s(self) -> Fraction:
        """Control interval in seconds."""
        return self._dt_s

    def reset(self) -> None:
        """Stateless, so there is nothing to clear."""

    def step(
        self,
        clock: SimulationClock,
        datacenter: DatacenterBackend,
        grid: GridBackend,
        events: EventEmitter,
    ) -> list[DatacenterCommand | GridCommand]:
        """Never issues commands."""
        return []

openg2g.controller.ofo

Online Feedback Optimization (OFO) batch-size controller.

Implements the primal-dual algorithm for joint voltage regulation and latency management via GPU batch size control.

OFOConfig

Bases: BaseModel

Online Feedback Optimization tuning parameters.

Attributes:

Name Type Description
primal_step_size float

Primal descent step size ρ_x (Eq. 8).

w_throughput float

Throughput weight in primal gradient.

w_switch float

Switching cost regularizer weight γ (Eq. 4a).

voltage_gradient_scale float

Scaling factor k_v for voltage dual term in the primal gradient.

v_min float

Lower voltage bound (pu).

v_max float

Upper voltage bound (pu).

voltage_dual_step_size float

Voltage dual ascent step size ρ_v (Eqs. 5-6).

latency_dual_step_size float

Latency dual ascent step size ρ_l (Eq. 7).

sensitivity_update_interval int

Steps between H-matrix re-estimation (0 = only once at init).

sensitivity_perturbation_kw float

Perturbation magnitude (kW) for finite-difference sensitivity estimation.

Source code in openg2g/controller/ofo.py
class OFOConfig(BaseModel):
    """Online Feedback Optimization tuning parameters.

    Attributes:
        primal_step_size: Primal descent step size ρ_x (Eq. 8).
        w_throughput: Throughput weight in primal gradient.
        w_switch: Switching cost regularizer weight γ (Eq. 4a).
        voltage_gradient_scale: Scaling factor k_v for voltage dual term
            in the primal gradient.
        v_min: Lower voltage bound (pu).
        v_max: Upper voltage bound (pu).
        voltage_dual_step_size: Voltage dual ascent step size ρ_v (Eqs. 5-6).
        latency_dual_step_size: Latency dual ascent step size ρ_l (Eq. 7).
        sensitivity_update_interval: Steps between H-matrix re-estimation
            (0 = only once at init).
        sensitivity_perturbation_kw: Perturbation magnitude (kW) for
            finite-difference sensitivity estimation.
    """

    # Frozen: an OFO config is immutable once constructed.
    model_config = ConfigDict(frozen=True)

    # Primal
    primal_step_size: float = 0.05  # ρ_x (Eq. 8)
    w_throughput: float = 0.1  # throughput weight in primal gradient
    w_switch: float = 0.0  # switching-cost weight γ (Eq. 4a)
    voltage_gradient_scale: float = 1e6  # k_v scaling of the voltage dual term

    # Dual
    v_min: float = 0.95  # lower voltage bound (pu)
    v_max: float = 1.05  # upper voltage bound (pu)
    voltage_dual_step_size: float = 0.5  # ρ_v (Eqs. 5-6)
    latency_dual_step_size: float = 1.0  # ρ_l (Eq. 7)

    # Sensitivity
    sensitivity_update_interval: int = 0  # steps between H re-estimation; 0 = only at init
    sensitivity_perturbation_kw: float = 100.0  # finite-difference perturbation (kW)

LogisticModelStore

Per-model logistic models for power, latency, and throughput.

Used by OFOBatchSizeController to compute gradients of the Lagrangian with respect to batch size.

Attributes:

Name Type Description
COL_MODEL_LABEL

Column name for model label in the CSV.

COL_METRIC

Column name for metric type in the CSV.

Source code in openg2g/controller/ofo.py
class LogisticModelStore:
    """Per-model logistic models for power, latency, and throughput.

    Used by
    [`OFOBatchSizeController`][openg2g.controller.ofo.OFOBatchSizeController]
    to compute gradients of the Lagrangian with respect to batch size.

    Attributes:
        COL_MODEL_LABEL: Column name for model label in the CSV.
        COL_METRIC: Column name for metric type in the CSV.
    """

    # CSV schema shared by save() and load().
    COL_MODEL_LABEL = "model_label"
    COL_METRIC = "metric"

    def __init__(
        self,
        power: dict[str, LogisticModel],
        latency: dict[str, LogisticModel],
        throughput: dict[str, LogisticModel],
    ) -> None:
        # Defensive copies so callers cannot mutate the store's fits.
        self._power = dict(power)
        self._latency = dict(latency)
        self._throughput = dict(throughput)
        # Raw benchmark samples per model/batch; populated only by generate()
        # and consumed by save(plot=True) to overlay data points on the fits.
        self._by_batch: dict[str, dict[int, list[tuple[float, float, float]]]] | None = None

    def power(self, model: str) -> LogisticModel:
        """Return the power logistic model for a model label."""
        return self._power[model]

    def latency(self, model: str) -> LogisticModel:
        """Return the latency logistic model for a model label."""
        return self._latency[model]

    def throughput(self, model: str) -> LogisticModel:
        """Return the throughput logistic model for a model label."""
        return self._throughput[model]

    @property
    def power_fits(self) -> dict[str, LogisticModel]:
        """Copy of all power fits, keyed by model label."""
        return dict(self._power)

    @property
    def latency_fits(self) -> dict[str, LogisticModel]:
        """Copy of all latency fits, keyed by model label."""
        return dict(self._latency)

    @property
    def throughput_fits(self) -> dict[str, LogisticModel]:
        """Copy of all throughput fits, keyed by model label."""
        return dict(self._throughput)

    @classmethod
    def generate(
        cls,
        models: tuple[InferenceModelSpec, ...],
        data_sources: dict[str, Any],
        *,
        runs: Any = None,
        mlenergy_data_dir: Path | None = None,
    ) -> LogisticModelStore:
        """Generate logistic fits from ML.ENERGY benchmark data.

        Args:
            models: Model specifications.
            data_sources: Per-model `MLEnergySource` instances, keyed by
                `model_label`.
            runs: Pre-loaded `LLMRuns` object. If `None`, loads from
                `mlenergy_data_dir` or the HuggingFace Hub.
            mlenergy_data_dir: Path to compiled mlenergy-data directory.
                Ignored if `runs` is provided.

        Returns:
            A new `LogisticModelStore` with fitted logistic models.

        Raises:
            ValueError: If no runs match, a model lacks a data source or
                `model_id`, or a model's filters match zero runs.
        """
        if runs is None:
            # Restrict the load to tasks actually referenced by data sources.
            unique_tasks = {src.task for src in data_sources.values()}
            if mlenergy_data_dir:
                runs = LLMRuns.from_directory(str(mlenergy_data_dir), stable_only=False).task(*unique_tasks)
            else:
                runs = LLMRuns.from_hf(stable_only=False).task(*unique_tasks)
        if not runs:
            raise ValueError("No runs found for the specified tasks")

        # One filtered subset of benchmark runs per served model label.
        subsets_by_label: dict[str, Any] = {}
        for ms in models:
            src = data_sources.get(ms.model_label)
            if src is None:
                raise ValueError(f"No data source for model {ms.model_label!r}")
            model_id = ms.model_id
            if not model_id:
                raise ValueError(f"model_id is required for data generation (model={ms.model_label!r})")

            subset = (
                runs.model_id(model_id).gpu_model(src.gpu).num_gpus(ms.gpus_per_replica).max_num_seqs(*src.batch_sizes)
            )
            if not subset:
                raise ValueError(
                    f"Config matched zero runs for logistic fits: model_id={model_id!r}, "
                    f"gpu={src.gpu!r}, num_gpus={ms.gpus_per_replica}, "
                    f"batch_sizes={src.batch_sizes}"
                )
            subsets_by_label[ms.model_label] = subset

        all_by_batch: dict[str, dict[int, list[tuple[float, float, float]]]] = {}
        power: dict[str, LogisticModel] = {}
        latency: dict[str, LogisticModel] = {}
        throughput: dict[str, LogisticModel] = {}
        for model_label, group in subsets_by_label.items():
            exclude = set(data_sources[model_label].fit_exclude_batch_sizes)
            # Group (power W, latency s, throughput tok/s) samples by batch size.
            by_batch: dict[int, list[tuple[float, float, float]]] = {}
            for r in group:
                if r.max_num_seqs in exclude:
                    continue
                by_batch.setdefault(r.max_num_seqs, []).append(
                    (r.avg_power_watts, r.mean_itl_ms / 1000.0, r.output_throughput_tokens_per_sec)
                )
            all_by_batch[model_label] = by_batch

            batches = sorted(by_batch.keys())
            if not batches:
                continue

            # Fits operate in x = log2(batch); clip guards against log2(0).
            x = np.log2(np.array(batches, dtype=float).clip(min=1))
            for _metric_name, idx, target in [
                ("power", 0, power),
                ("latency", 1, latency),
                ("throughput", 2, throughput),
            ]:
                # Median across repeated runs at the same batch size tames outliers.
                y = np.array([float(np.median([t[idx] for t in by_batch[b]])) for b in batches])
                fit = LogisticModel.fit(x, y)
                target[model_label] = fit

        if not power and not latency and not throughput:
            raise ValueError("No logistic fit rows produced")
        store = cls(power=power, latency=latency, throughput=throughput)
        # Keep the raw samples so save(plot=True) can plot data behind the fits.
        store._by_batch = all_by_batch
        return store

    def save(self, csv_path: Path, *, plot: bool = False) -> None:
        """Save logistic fits to a CSV.

        Args:
            csv_path: Output CSV path.
            plot: If `True`, also write a logistic fits plot to the
                same directory.
        """
        csv_path = Path(csv_path)
        csv_path.parent.mkdir(parents=True, exist_ok=True)
        rows: list[dict[str, Any]] = []
        for metric_name, fits in [("power", self._power), ("latency", self._latency), ("throughput", self._throughput)]:
            for label in sorted(fits):
                model = fits[label]
                rows.append(
                    {
                        self.COL_MODEL_LABEL: label,
                        self.COL_METRIC: metric_name,
                        "L": model.L,
                        "x0": model.x0,
                        "k": model.k,
                        "b0": model.b0,
                    }
                )
        pd.DataFrame(rows).to_csv(csv_path, index=False)

        # getattr guards instances missing the attribute (e.g. unpickled);
        # plotting needs the raw samples only generate() records.
        by_batch = getattr(self, "_by_batch", None)
        if plot and by_batch is not None:
            model_labels = sorted(self._power.keys())
            _plot_logistic_fits(
                by_batch,
                self._power,
                self._latency,
                self._throughput,
                model_labels,
                csv_path.parent,
            )

    @classmethod
    def load(cls, csv_path: Path | str) -> LogisticModelStore:
        """Load power, latency, and throughput fits from a merged CSV.

        Expected columns: `model_label`, `metric`, plus the logistic
        model parameter columns (`L`, `x0`, `k`, `b0`).

        The `metric` column must contain `power`, `latency`, or
        `throughput` (case-insensitive).

        Args:
            csv_path: Path to the logistic fits CSV.

        Raises:
            ValueError: If required columns are missing or no fit rows load.
        """
        csv_path = Path(csv_path)
        df = pd.read_csv(csv_path)

        required_cols = [cls.COL_MODEL_LABEL, cls.COL_METRIC]
        missing = [c for c in required_cols if c not in df.columns]
        if missing:
            raise ValueError(f"{csv_path} missing columns: {missing}. Got: {list(df.columns)}")

        power: dict[str, LogisticModel] = {}
        latency: dict[str, LogisticModel] = {}
        throughput: dict[str, LogisticModel] = {}
        targets = {"power": power, "latency": latency, "throughput": throughput}
        for row in df.to_dict(orient="records"):
            metric = str(row[cls.COL_METRIC]).strip().lower()
            # Rows with unknown metric values are skipped, not treated as errors.
            if metric in targets:
                targets[metric][str(row[cls.COL_MODEL_LABEL])] = LogisticModel.from_dict(row)

        if not power and not latency and not throughput:
            raise ValueError(f"No logistic model rows loaded from {csv_path}")
        return cls(power=power, latency=latency, throughput=throughput)

    @classmethod
    def ensure(
        cls,
        csv_path: Path,
        models: tuple[InferenceModelSpec, ...] | None = None,
        data_sources: dict[str, Any] | None = None,
        *,
        mlenergy_data_dir: Path | None = None,
        plot: bool = False,
    ) -> LogisticModelStore:
        """Load from `csv_path`, generating first if needed.

        Args:
            csv_path: Path to the logistic fits CSV.
            models: Model specifications. Required when no cached file exists.
            data_sources: Per-model `MLEnergySource` instances, keyed by
                `model_label`. Required when no cached file exists.
            mlenergy_data_dir: Path to compiled mlenergy-data directory.
            plot: If `True`, generate a logistic fits plot on generation.

        Raises:
            ValueError: If generation is needed but `models` or
                `data_sources` is not provided.
        """
        csv_path = Path(csv_path)
        if not csv_path.exists():
            if models is None or data_sources is None:
                raise ValueError("models and data_sources required for LogisticModelStore generation (no cached data)")
            logger.info("Generating logistic fits to %s ...", csv_path)
            # Round-trip through save()/load() so generated and cached paths
            # exercise identical CSV parsing.
            cls.generate(models, data_sources, mlenergy_data_dir=mlenergy_data_dir).save(csv_path, plot=plot)
        return cls.load(csv_path)

power(model)

Return the power logistic model for a model label.

Source code in openg2g/controller/ofo.py
def power(self, model: str) -> LogisticModel:
    """Look up the fitted power-vs-batch-size curve for `model`."""
    fits = self._power
    return fits[model]

latency(model)

Return the latency logistic model for a model label.

Source code in openg2g/controller/ofo.py
def latency(self, model: str) -> LogisticModel:
    """Look up the fitted latency-vs-batch-size curve for `model`."""
    fits = self._latency
    return fits[model]

throughput(model)

Return the throughput logistic model for a model label.

Source code in openg2g/controller/ofo.py
def throughput(self, model: str) -> LogisticModel:
    """Look up the fitted throughput-vs-batch-size curve for `model`."""
    fits = self._throughput
    return fits[model]

generate(models, data_sources, *, runs=None, mlenergy_data_dir=None) classmethod

Generate logistic fits from ML.ENERGY benchmark data.

Parameters:

Name Type Description Default
models tuple[InferenceModelSpec, ...]

Model specifications.

required
data_sources dict[str, Any]

Per-model MLEnergySource instances, keyed by model_label.

required
runs Any

Pre-loaded LLMRuns object. If None, loads from mlenergy_data_dir or the HuggingFace Hub.

None
mlenergy_data_dir Path | None

Path to compiled mlenergy-data directory. Ignored if runs is provided.

None

Returns:

Type Description
LogisticModelStore

A new LogisticModelStore with fitted logistic models.

Source code in openg2g/controller/ofo.py
@classmethod
def generate(
    cls,
    models: tuple[InferenceModelSpec, ...],
    data_sources: dict[str, Any],
    *,
    runs: Any = None,
    mlenergy_data_dir: Path | None = None,
) -> LogisticModelStore:
    """Generate logistic fits from ML.ENERGY benchmark data.

    Args:
        models: Model specifications.
        data_sources: Per-model `MLEnergySource` instances, keyed by
            `model_label`.
        runs: Pre-loaded `LLMRuns` object. If `None`, loads from
            `mlenergy_data_dir` or the HuggingFace Hub.
        mlenergy_data_dir: Path to compiled mlenergy-data directory.
            Ignored if `runs` is provided.

    Returns:
        A new `LogisticModelStore` with fitted logistic models.

    Raises:
        ValueError: If no runs match, a model lacks a data source or
            `model_id`, or a model's filters match zero runs.
    """
    if runs is None:
        # Restrict the load to tasks actually referenced by data sources.
        unique_tasks = {src.task for src in data_sources.values()}
        if mlenergy_data_dir:
            runs = LLMRuns.from_directory(str(mlenergy_data_dir), stable_only=False).task(*unique_tasks)
        else:
            runs = LLMRuns.from_hf(stable_only=False).task(*unique_tasks)
    if not runs:
        raise ValueError("No runs found for the specified tasks")

    # One filtered subset of benchmark runs per served model label.
    subsets_by_label: dict[str, Any] = {}
    for ms in models:
        src = data_sources.get(ms.model_label)
        if src is None:
            raise ValueError(f"No data source for model {ms.model_label!r}")
        model_id = ms.model_id
        if not model_id:
            raise ValueError(f"model_id is required for data generation (model={ms.model_label!r})")

        subset = (
            runs.model_id(model_id).gpu_model(src.gpu).num_gpus(ms.gpus_per_replica).max_num_seqs(*src.batch_sizes)
        )
        if not subset:
            raise ValueError(
                f"Config matched zero runs for logistic fits: model_id={model_id!r}, "
                f"gpu={src.gpu!r}, num_gpus={ms.gpus_per_replica}, "
                f"batch_sizes={src.batch_sizes}"
            )
        subsets_by_label[ms.model_label] = subset

    all_by_batch: dict[str, dict[int, list[tuple[float, float, float]]]] = {}
    power: dict[str, LogisticModel] = {}
    latency: dict[str, LogisticModel] = {}
    throughput: dict[str, LogisticModel] = {}
    for model_label, group in subsets_by_label.items():
        exclude = set(data_sources[model_label].fit_exclude_batch_sizes)
        # Group (power W, latency s, throughput tok/s) samples by batch size.
        by_batch: dict[int, list[tuple[float, float, float]]] = {}
        for r in group:
            if r.max_num_seqs in exclude:
                continue
            by_batch.setdefault(r.max_num_seqs, []).append(
                (r.avg_power_watts, r.mean_itl_ms / 1000.0, r.output_throughput_tokens_per_sec)
            )
        all_by_batch[model_label] = by_batch

        batches = sorted(by_batch.keys())
        if not batches:
            continue

        # Fits operate in x = log2(batch); clip guards against log2(0).
        x = np.log2(np.array(batches, dtype=float).clip(min=1))
        for _metric_name, idx, target in [
            ("power", 0, power),
            ("latency", 1, latency),
            ("throughput", 2, throughput),
        ]:
            # Median across repeated runs at the same batch size tames outliers.
            y = np.array([float(np.median([t[idx] for t in by_batch[b]])) for b in batches])
            fit = LogisticModel.fit(x, y)
            target[model_label] = fit

    if not power and not latency and not throughput:
        raise ValueError("No logistic fit rows produced")
    store = cls(power=power, latency=latency, throughput=throughput)
    # Keep the raw samples so save(plot=True) can plot data behind the fits.
    store._by_batch = all_by_batch
    return store

save(csv_path, *, plot=False)

Save logistic fits to a CSV.

Parameters:

Name Type Description Default
csv_path Path

Output CSV path.

required
plot bool

If True, also write a logistic fits plot to the same directory.

False
Source code in openg2g/controller/ofo.py
def save(self, csv_path: Path, *, plot: bool = False) -> None:
    """Serialize the fitted logistic curves to a CSV file.

    Args:
        csv_path: Destination file; parent directories are created.
        plot: When `True`, additionally render a fits plot in the
            same directory as the CSV.
    """
    csv_path = Path(csv_path)
    csv_path.parent.mkdir(parents=True, exist_ok=True)

    records: list[dict[str, Any]] = []
    metric_groups = (
        ("power", self._power),
        ("latency", self._latency),
        ("throughput", self._throughput),
    )
    for metric_name, fits in metric_groups:
        for label in sorted(fits):
            fit = fits[label]
            record = {
                self.COL_MODEL_LABEL: label,
                self.COL_METRIC: metric_name,
                "L": fit.L,
                "x0": fit.x0,
                "k": fit.k,
                "b0": fit.b0,
            }
            records.append(record)
    pd.DataFrame(records).to_csv(csv_path, index=False)

    # Plotting needs the raw samples that only generate() records.
    raw_points = getattr(self, "_by_batch", None)
    if plot and raw_points is not None:
        model_labels = sorted(self._power.keys())
        _plot_logistic_fits(
            raw_points,
            self._power,
            self._latency,
            self._throughput,
            model_labels,
            csv_path.parent,
        )

load(csv_path) classmethod

Load power, latency, and throughput fits from a merged CSV.

Expected columns: model_label, metric, plus the logistic model parameter columns (L, x0, k, b0).

The metric column must contain power, latency, or throughput (case-insensitive).

Parameters:

Name Type Description Default
csv_path Path | str

Path to the logistic fits CSV.

required
Source code in openg2g/controller/ofo.py
@classmethod
def load(cls, csv_path: Path | str) -> LogisticModelStore:
    """Load power, latency, and throughput fits from a merged CSV.

    The file must provide `model_label` and `metric` columns alongside
    the logistic parameter columns (`L`, `x0`, `k`, `b0`). The `metric`
    values are matched case-insensitively against `power`, `latency`,
    and `throughput`; other rows are ignored.

    Args:
        csv_path: Path to the logistic fits CSV.

    Raises:
        ValueError: If required columns are absent or no fit rows load.
    """
    csv_path = Path(csv_path)
    df = pd.read_csv(csv_path)

    needed = [cls.COL_MODEL_LABEL, cls.COL_METRIC]
    missing = [col for col in needed if col not in df.columns]
    if missing:
        raise ValueError(f"{csv_path} missing columns: {missing}. Got: {list(df.columns)}")

    fits_by_metric: dict[str, dict[str, LogisticModel]] = {
        "power": {},
        "latency": {},
        "throughput": {},
    }
    for record in df.to_dict(orient="records"):
        metric_key = str(record[cls.COL_METRIC]).strip().lower()
        bucket = fits_by_metric.get(metric_key)
        if bucket is not None:
            bucket[str(record[cls.COL_MODEL_LABEL])] = LogisticModel.from_dict(record)

    power = fits_by_metric["power"]
    latency = fits_by_metric["latency"]
    throughput = fits_by_metric["throughput"]
    if not (power or latency or throughput):
        raise ValueError(f"No logistic model rows loaded from {csv_path}")
    return cls(power=power, latency=latency, throughput=throughput)

ensure(csv_path, models=None, data_sources=None, *, mlenergy_data_dir=None, plot=False) classmethod

Load from csv_path, generating first if needed.

Parameters:

Name Type Description Default
csv_path Path

Path to the logistic fits CSV.

required
models tuple[InferenceModelSpec, ...] | None

Model specifications. Required when no cached file exists.

None
data_sources dict[str, Any] | None

Per-model MLEnergySource instances, keyed by model_label. Required when no cached file exists.

None
mlenergy_data_dir Path | None

Path to compiled mlenergy-data directory.

None
plot bool

If True, generate a logistic fits plot on generation.

False
Source code in openg2g/controller/ofo.py
@classmethod
def ensure(
    cls,
    csv_path: Path,
    models: tuple[InferenceModelSpec, ...] | None = None,
    data_sources: dict[str, Any] | None = None,
    *,
    mlenergy_data_dir: Path | None = None,
    plot: bool = False,
) -> LogisticModelStore:
    """Return fits from `csv_path`, generating the file first if absent.

    Args:
        csv_path: Path to the logistic fits CSV.
        models: Model specifications; required only when generating.
        data_sources: Per-model `MLEnergySource` instances, keyed by
            `model_label`; required only when generating.
        mlenergy_data_dir: Path to compiled mlenergy-data directory.
        plot: If `True`, also emit a fits plot when generating.

    Raises:
        ValueError: If generation is needed but `models` or
            `data_sources` is missing.
    """
    csv_path = Path(csv_path)
    needs_generation = not csv_path.exists()
    if needs_generation:
        if models is None or data_sources is None:
            raise ValueError("models and data_sources required for LogisticModelStore generation (no cached data)")
        logger.info("Generating logistic fits to %s ...", csv_path)
        store = cls.generate(models, data_sources, mlenergy_data_dir=mlenergy_data_dir)
        store.save(csv_path, plot=plot)
    # Always read back through load() so both paths share CSV parsing.
    return cls.load(csv_path)

VoltageDualVariables

Full-network duals for voltage box constraints.

Maintains per-bus dual variables for under- and overvoltage and updates them via projected gradient ascent:

dual_undervoltage  <- [dual_undervoltage  + ρ_v * (v_min - v̂)]+
dual_overvoltage   <- [dual_overvoltage   + ρ_v * (v̂ - v_max)]+

Parameters:

Name Type Description Default
n_bus_phases int

Number of bus-phase pairs in the voltage vector (3M).

required
config OFOConfig

OFO configuration (voltage bounds and dual step size).

required
Source code in openg2g/controller/ofo.py
class VoltageDualVariables:
    """Projected-ascent duals for the per-bus voltage box constraints.

    Tracks one nonnegative multiplier per bus-phase for each side of the
    voltage band and advances them by projected gradient ascent:

        dual_undervoltage  <- [dual_undervoltage  + ρ_v * (v_min - v̂)]+
        dual_overvoltage   <- [dual_overvoltage   + ρ_v * (v̂ - v_max)]+

    Args:
        n_bus_phases: Number of bus-phase pairs in the voltage vector (3M).
        config: OFO configuration (voltage bounds and dual step size).
    """

    def __init__(self, n_bus_phases: int, config: OFOConfig) -> None:
        self.config = config
        size = int(n_bus_phases)
        # λ (undervoltage, Eq. 5) and λ̄ (overvoltage, Eq. 6) in the G2G paper.
        self.dual_undervoltage = np.zeros(size, dtype=float)
        self.dual_overvoltage = np.zeros(size, dtype=float)

    def update(self, observed_voltages: np.ndarray) -> None:
        """Advance both duals one projected-ascent step.

        Args:
            observed_voltages: Observed voltage magnitudes (pu), shape
                `(n_bus_phases,)`.

        Raises:
            ValueError: If `observed_voltages` length does not match the
                dual dimension.
        """
        v = np.asarray(observed_voltages, float).reshape(-1)
        n = self.dual_undervoltage.shape[0]
        if v.shape[0] != n:
            raise ValueError(
                f"observed_voltages has len {v.shape[0]} "
                f"but duals have len {n}"
            )
        cfg = self.config
        step = float(cfg.voltage_dual_step_size)
        undershoot = float(cfg.v_min) - v
        overshoot = v - float(cfg.v_max)
        # Ascend on the violation, then project onto the nonnegative orthant.
        self.dual_undervoltage = np.maximum(self.dual_undervoltage + step * undershoot, 0.0)
        self.dual_overvoltage = np.maximum(self.dual_overvoltage + step * overshoot, 0.0)

    def dual_difference(self) -> np.ndarray:
        """Return the voltage dual difference (η = λ̄ − λ, Appendix B)."""
        overvoltage = self.dual_overvoltage
        undervoltage = self.dual_undervoltage
        return overvoltage - undervoltage

update(observed_voltages)

Update duals given observed voltage vector.

Parameters:

Name Type Description Default
observed_voltages ndarray

Observed voltage magnitudes (pu), shape (n_bus_phases,).

required

Raises:

Type Description
ValueError

If observed_voltages length does not match the dual dimension.

Source code in openg2g/controller/ofo.py
def update(self, observed_voltages: np.ndarray) -> None:
    """Advance both voltage duals one projected-ascent step.

    Args:
        observed_voltages: Observed voltage magnitudes (pu), shape
            `(n_bus_phases,)`.

    Raises:
        ValueError: If `observed_voltages` length does not match the dual
            dimension.
    """
    v = np.asarray(observed_voltages, float).reshape(-1)
    n = self.dual_undervoltage.shape[0]
    if v.shape[0] != n:
        raise ValueError(
            f"observed_voltages has len {v.shape[0]} "
            f"but duals have len {n}"
        )
    cfg = self.config
    step = float(cfg.voltage_dual_step_size)
    undershoot = float(cfg.v_min) - v
    overshoot = v - float(cfg.v_max)
    # Ascend on the violation, then project onto the nonnegative orthant.
    self.dual_undervoltage = np.maximum(self.dual_undervoltage + step * undershoot, 0.0)
    self.dual_overvoltage = np.maximum(self.dual_overvoltage + step * overshoot, 0.0)

dual_difference()

Return the voltage dual difference (η = λ̄ − λ, Appendix B).

Source code in openg2g/controller/ofo.py
def dual_difference(self) -> np.ndarray:
    """Compute the net voltage dual η = λ̄ − λ (Appendix B)."""
    overvoltage = self.dual_overvoltage
    undervoltage = self.dual_undervoltage
    return overvoltage - undervoltage

PrimalBatchOptimizer

Primal batch-size optimizer operating in log2 space.

Maintains continuous state x_i = log2(batch_i) per model and applies a gradient descent step using voltage duals, latency duals, and fitted power/latency/throughput curves.

Parameters:

Name Type Description Default
models list[InferenceModelSpec]

Model specifications for each served model.

required
feasible_batch_sizes list[int]

Allowed batch sizes (union across all models).

required
power_fits dict[str, LogisticModel]

Per-model logistic fit for power vs log2(batch_size).

required
latency_fits dict[str, LogisticModel]

Per-model logistic fit for latency vs log2(batch_size).

required
throughput_fits dict[str, LogisticModel]

Per-model logistic fit for throughput vs log2(batch_size).

required
config OFOConfig

OFO configuration (step size, throughput/switch weights, voltage gradient scale).

required
Source code in openg2g/controller/ofo.py
class PrimalBatchOptimizer:
    """Primal batch-size optimizer operating in log2 space.

    Maintains continuous state `x_i = log2(batch_i)` per model and applies
    a gradient descent step using voltage duals, latency duals, and fitted
    power/latency/throughput curves.

    Args:
        models: Model specifications for each served model.
        feasible_batch_sizes: Allowed batch sizes (union across all models).
        power_fits: Per-model logistic fit for power vs log2(batch_size).
        latency_fits: Per-model logistic fit for latency vs log2(batch_size).
        throughput_fits: Per-model logistic fit for throughput vs
            log2(batch_size).
        config: OFO configuration (step size, throughput/switch weights,
            voltage gradient scale).

    Raises:
        ValueError: If `feasible_batch_sizes` is empty.
    """

    def __init__(
        self,
        *,
        models: list[InferenceModelSpec],
        feasible_batch_sizes: list[int],
        power_fits: dict[str, LogisticModel],
        latency_fits: dict[str, LogisticModel],
        throughput_fits: dict[str, LogisticModel],
        config: OFOConfig,
    ) -> None:
        self.models = list(models)
        # De-duplicate and sort so bisect-based discretization works.
        self.feasible_batch_sizes = sorted({int(b) for b in feasible_batch_sizes})
        if not self.feasible_batch_sizes:
            raise ValueError("feasible_batch_sizes cannot be empty.")

        self.power_fits = power_fits
        self.latency_fits = latency_fits
        self.throughput_fits = throughput_fits
        self.config = config

        # Continuous state lives in x = log2(batch); these are its box bounds.
        self.log_batch_size_min = math.log2(min(self.feasible_batch_sizes))
        self.log_batch_size_max = math.log2(max(self.feasible_batch_sizes))

        # Every model starts at the largest feasible batch size.
        self.log_batch_size_by_model: dict[str, float] = {
            ms.model_label: float(self.log_batch_size_max) for ms in self.models
        }
        self.prev_log_batch_size_by_model: dict[str, float] = dict(self.log_batch_size_by_model)

        # Per-model throughput normalization: r_i(x_max) for a single replica
        self.throughput_max_by_model: dict[str, float] = {}
        b_max = int(max(self.feasible_batch_sizes))
        for ms in self.models:
            label = ms.model_label
            try:
                # NOTE(review): eval() receives the raw batch size b_max here,
                # while deriv_wrt_x() in step() is given log2(batch); confirm
                # that LogisticModel.eval expects raw batch sizes — TODO verify.
                th_max = float(self.throughput_fits[label].eval(b_max))
            except Exception:
                th_max = float("nan")
            if (not np.isfinite(th_max)) or (th_max <= 0.0):
                # Fallback keeps the normalization divisor positive and finite.
                th_max = 1.0
            self.throughput_max_by_model[label] = th_max

    def _clamp_log_batch_size(self, log_batch_size: float) -> float:
        """Project a log2 batch value onto [log_batch_size_min, log_batch_size_max]."""
        return float(min(max(float(log_batch_size), self.log_batch_size_min), self.log_batch_size_max))

    def _discretize_batch(self, log_batch_size: float) -> int:
        """Map continuous log2 state to the nearest feasible discrete batch size."""
        b_cont = 2.0 ** float(log_batch_size)
        # bisect yields the two feasible sizes bracketing b_cont; take the closer.
        idx = bisect.bisect_left(self.feasible_batch_sizes, b_cont)
        candidates = []
        if idx > 0:
            candidates.append(self.feasible_batch_sizes[idx - 1])
        if idx < len(self.feasible_batch_sizes):
            candidates.append(self.feasible_batch_sizes[idx])
        return int(min(candidates, key=lambda bb: abs(bb - b_cont)))

    def init_from_batches(self, batch_init: dict[str, int]) -> None:
        """Initialize log-batch-size state from discrete batch sizes."""
        for ms in self.models:
            label = ms.model_label
            # Models missing from batch_init default to the largest feasible batch.
            b = int(batch_init.get(label, max(self.feasible_batch_sizes)))
            log_batch_size = math.log2(max(b, 1))
            log_batch_size = self._clamp_log_batch_size(log_batch_size)
            # prev == current so the first step carries no switching penalty.
            self.log_batch_size_by_model[label] = float(log_batch_size)
            self.prev_log_batch_size_by_model[label] = float(log_batch_size)

    def step(
        self,
        *,
        voltage_dual_diff: np.ndarray,
        sensitivity_matrix: np.ndarray,
        phase_share_by_model: dict[str, np.ndarray],
        latency_dual_by_model: dict[str, float] | None = None,
        replica_count_by_model: dict[str, float] | None = None,
    ) -> dict[str, int]:
        """Primal gradient descent step.

        Args:
            voltage_dual_diff: Voltage dual difference vector
                (η = λ̄ − λ), shape `(n_bus_phases,)`.
            sensitivity_matrix: Voltage sensitivity matrix (H = dv/dp),
                shape `(n_bus_phases, 3)`.
            phase_share_by_model: Per-model normalized phase share vectors,
                shape `(3,)` each.
            latency_dual_by_model: Per-model latency dual variables (μ_i).
            replica_count_by_model: Per-model active replica counts (w_i).

        Returns:
            Next batch sizes per model.
        """
        voltage_dual_diff = np.asarray(voltage_dual_diff, float).reshape(-1)
        sensitivity_matrix = np.asarray(sensitivity_matrix, float)
        latency_dual_by_model = {} if latency_dual_by_model is None else dict(latency_dual_by_model)
        replica_count_by_model = {} if replica_count_by_model is None else dict(replica_count_by_model)

        step_size = float(self.config.primal_step_size)  # ρ_x
        w_throughput = float(self.config.w_throughput)
        w_switch = float(self.config.w_switch)
        voltage_gradient_scale = float(self.config.voltage_gradient_scale)

        batch_next: dict[str, int] = {}

        for ms in self.models:
            label = ms.model_label
            log_batch_size = float(self.log_batch_size_by_model[label])
            prev_log_batch_size = float(self.prev_log_batch_size_by_model.get(label, log_batch_size))

            replica_count = float(replica_count_by_model.get(label, 0.0))  # w_i
            # Sanitize: missing/NaN/negative replica counts contribute nothing.
            if (not np.isfinite(replica_count)) or (replica_count < 0.0):
                replica_count = 0.0

            phase_share = np.asarray(  # e_i (phase-allocation weight, p.7)
                phase_share_by_model.get(label, np.array([1 / 3, 1 / 3, 1 / 3], dtype=float)),
                float,
            ).reshape(3)
            s = float(np.sum(phase_share))
            # Renormalize to sum to 1; degenerate input falls back to uniform.
            if (not np.isfinite(s)) or s <= 0.0:
                phase_share = np.array([1 / 3, 1 / 3, 1 / 3], dtype=float)
            else:
                phase_share = phase_share / s

            weighted_sensitivity = sensitivity_matrix @ phase_share  # H @ e_i
            voltage_gradient = float(voltage_dual_diff @ weighted_sensitivity)

            # Single-replica derivatives of the fitted curves at the current x.
            dPdx_1 = float(self.power_fits[label].deriv_wrt_x(log_batch_size))
            dLdx_1 = float(self.latency_fits[label].deriv_wrt_x(log_batch_size))
            dThdx_1 = float(self.throughput_fits[label].deriv_wrt_x(log_batch_size))

            # Power fits were trained on watts; the grid-side terms use kW.
            dPdx_1_kw = dPdx_1 / 1000.0

            th_max = float(self.throughput_max_by_model.get(label, 1.0))
            if (not np.isfinite(th_max)) or (th_max <= 0.0):
                th_max = 1.0
            dThdx_norm_1 = dThdx_1 / th_max

            # Power/throughput scale with replica count; latency is per replica.
            dPdx = replica_count * dPdx_1_kw
            dThdx = replica_count * dThdx_norm_1
            dLdx = dLdx_1

            latency_dual = float(latency_dual_by_model.get(label, 0.0))  # μ_i
            if (not np.isfinite(latency_dual)) or (latency_dual < 0.0):
                latency_dual = 0.0

            # Gradient of the Lagrangian w.r.t. x_i = log2(batch_i).
            # G2G paper Eq. 18: nabla_x L = -dR/dx (throughput)
            #                              + 2*gamma*(x - x_prev) (switching)
            #                              + eta^T H e_i dP/dx (voltage dual)
            #                              + mu_i * dL/dx (latency dual)
            # Implementation extensions: wT scaling on throughput,
            #                            k_v scaling on voltage term
            # NOTE(review): the code applies w_switch without Eq. 18's factor
            # of 2 — presumably w_switch absorbs it; confirm against the paper.
            grad = 0.0
            grad -= w_throughput * dThdx
            grad += voltage_gradient_scale * voltage_gradient * dPdx
            grad += latency_dual * dLdx
            grad += w_switch * (log_batch_size - prev_log_batch_size)

            new_log_batch_size = self._clamp_log_batch_size(log_batch_size - step_size * grad)
            self.prev_log_batch_size_by_model[label] = log_batch_size
            self.log_batch_size_by_model[label] = new_log_batch_size
            batch_next[label] = self._discretize_batch(new_log_batch_size)

        return batch_next

init_from_batches(batch_init)

Initialize log-batch-size state from discrete batch sizes.

Source code in openg2g/controller/ofo.py
def init_from_batches(self, batch_init: dict[str, int]) -> None:
    """Initialize log-batch-size state from discrete batch sizes.

    Models absent from `batch_init` default to the largest feasible
    batch size. Both the current and previous log2 batch state are
    seeded with the same (clamped) value.
    """
    fallback = max(self.feasible_batch_sizes)
    for spec in self.models:
        name = spec.model_label
        batch = int(batch_init.get(name, fallback))
        # Guard against non-positive batches before taking log2.
        seeded = float(self._clamp_log_batch_size(math.log2(max(batch, 1))))
        self.log_batch_size_by_model[name] = seeded
        self.prev_log_batch_size_by_model[name] = seeded

step(*, voltage_dual_diff, sensitivity_matrix, phase_share_by_model, latency_dual_by_model=None, replica_count_by_model=None)

Primal gradient descent step.

Parameters:

Name Type Description Default
voltage_dual_diff ndarray

Voltage dual difference vector (η = λ̄ − λ), shape (n_bus_phases,).

required
sensitivity_matrix ndarray

Voltage sensitivity matrix (H = dv/dp), shape (n_bus_phases, 3).

required
phase_share_by_model dict[str, ndarray]

Per-model normalized phase share vectors, shape (3,) each.

required
latency_dual_by_model dict[str, float] | None

Per-model latency dual variables (μ_i).

None
replica_count_by_model dict[str, float] | None

Per-model active replica counts (w_i).

None

Returns:

Type Description
dict[str, int]

Next batch sizes per model.

Source code in openg2g/controller/ofo.py
def step(
    self,
    *,
    voltage_dual_diff: np.ndarray,
    sensitivity_matrix: np.ndarray,
    phase_share_by_model: dict[str, np.ndarray],
    latency_dual_by_model: dict[str, float] | None = None,
    replica_count_by_model: dict[str, float] | None = None,
) -> dict[str, int]:
    """Primal gradient descent step.

    Args:
        voltage_dual_diff: Voltage dual difference vector
            (η = λ̄ − λ), shape `(n_bus_phases,)`.
        sensitivity_matrix: Voltage sensitivity matrix (H = dv/dp),
            shape `(n_bus_phases, 3)`.
        phase_share_by_model: Per-model normalized phase share vectors,
            shape `(3,)` each.
        latency_dual_by_model: Per-model latency dual variables (μ_i).
        replica_count_by_model: Per-model active replica counts (w_i).

    Returns:
        Next batch sizes per model.
    """
    voltage_dual_diff = np.asarray(voltage_dual_diff, float).reshape(-1)
    sensitivity_matrix = np.asarray(sensitivity_matrix, float)
    latency_dual_by_model = {} if latency_dual_by_model is None else dict(latency_dual_by_model)
    replica_count_by_model = {} if replica_count_by_model is None else dict(replica_count_by_model)

    step_size = float(self.config.primal_step_size)  # ρ_x
    w_throughput = float(self.config.w_throughput)
    w_switch = float(self.config.w_switch)
    voltage_gradient_scale = float(self.config.voltage_gradient_scale)

    batch_next: dict[str, int] = {}

    for ms in self.models:
        label = ms.model_label
        log_batch_size = float(self.log_batch_size_by_model[label])
        prev_log_batch_size = float(self.prev_log_batch_size_by_model.get(label, log_batch_size))

        replica_count = float(replica_count_by_model.get(label, 0.0))  # w_i
        if (not np.isfinite(replica_count)) or (replica_count < 0.0):
            replica_count = 0.0

        phase_share = np.asarray(  # e_i (phase-allocation weight, p.7)
            phase_share_by_model.get(label, np.array([1 / 3, 1 / 3, 1 / 3], dtype=float)),
            float,
        ).reshape(3)
        s = float(np.sum(phase_share))
        if (not np.isfinite(s)) or s <= 0.0:
            phase_share = np.array([1 / 3, 1 / 3, 1 / 3], dtype=float)
        else:
            phase_share = phase_share / s

        weighted_sensitivity = sensitivity_matrix @ phase_share  # H @ e_i
        voltage_gradient = float(voltage_dual_diff @ weighted_sensitivity)

        dPdx_1 = float(self.power_fits[label].deriv_wrt_x(log_batch_size))
        dLdx_1 = float(self.latency_fits[label].deriv_wrt_x(log_batch_size))
        dThdx_1 = float(self.throughput_fits[label].deriv_wrt_x(log_batch_size))

        dPdx_1_kw = dPdx_1 / 1000.0

        th_max = float(self.throughput_max_by_model.get(label, 1.0))
        if (not np.isfinite(th_max)) or (th_max <= 0.0):
            th_max = 1.0
        dThdx_norm_1 = dThdx_1 / th_max

        dPdx = replica_count * dPdx_1_kw
        dThdx = replica_count * dThdx_norm_1
        dLdx = dLdx_1

        latency_dual = float(latency_dual_by_model.get(label, 0.0))  # μ_i
        if (not np.isfinite(latency_dual)) or (latency_dual < 0.0):
            latency_dual = 0.0

        # Gradient of the Lagrangian w.r.t. x_i = log2(batch_i).
        # G2G paper Eq. 18: nabla_x L = -dR/dx (throughput)
        #                              + 2*gamma*(x - x_prev) (switching)
        #                              + eta^T H e_i dP/dx (voltage dual)
        #                              + mu_i * dL/dx (latency dual)
        # Implementation extensions: wT scaling on throughput,
        #                            k_v scaling on voltage term
        grad = 0.0
        grad -= w_throughput * dThdx
        grad += voltage_gradient_scale * voltage_gradient * dPdx
        grad += latency_dual * dLdx
        grad += w_switch * (log_batch_size - prev_log_batch_size)

        new_log_batch_size = self._clamp_log_batch_size(log_batch_size - step_size * grad)
        self.prev_log_batch_size_by_model[label] = log_batch_size
        self.log_batch_size_by_model[label] = new_log_batch_size
        batch_next[label] = self._discretize_batch(new_log_batch_size)

    return batch_next

OFOBatchSizeController

Bases: Controller[LLMBatchSizeControlledDatacenter[LLMDatacenterState], OpenDSSGrid]

Online Feedback Optimization controller for batch-size regulation.

Reads grid voltage and datacenter state, updates voltage and latency duals, runs the primal batch-size optimizer, and returns new batch sizes. Latency dual updates use dc_state.observed_itl_s_by_model.

Parameters:

Name Type Description Default
inference_models tuple[InferenceModelSpec, ...]

Model specifications served in the datacenter.

required
models LogisticModelStore

Per-model logistic models for power, latency, and throughput used in gradient computation.

required
config OFOConfig | None

Unified OFO tuning parameters.

None
dt_s Fraction

Control interval (seconds).

Fraction(1)
Source code in openg2g/controller/ofo.py
class OFOBatchSizeController(Controller[LLMBatchSizeControlledDatacenter[LLMDatacenterState], OpenDSSGrid]):
    """Online Feedback Optimization controller for batch-size regulation.

    Reads grid voltage and datacenter state, updates voltage and latency
    duals, runs the primal batch-size optimizer, and returns new batch
    sizes. Latency dual updates use [`dc_state.observed_itl_s_by_model`
    ][openg2g.datacenter.base.LLMDatacenterState.observed_itl_s_by_model].

    Args:
        inference_models: Model specifications served in the datacenter.
        models: Per-model logistic models for power, latency, and
            throughput used in gradient computation.
        config: Unified OFO tuning parameters.
        dt_s: Control interval (seconds).
    """

    def __init__(
        self,
        inference_models: tuple[InferenceModelSpec, ...],
        *,
        models: LogisticModelStore,
        config: OFOConfig | None = None,
        dt_s: Fraction = Fraction(1),
        site_id: str | None = None,
        initial_batch_sizes: dict[str, int] | None = None,
    ) -> None:
        if config is None:
            config = OFOConfig()

        # Fail fast on an empty or ambiguous model set.
        if not inference_models:
            raise ValueError("inference_models must not be empty.")
        labels = [ms.model_label for ms in inference_models]
        if len(labels) != len(set(labels)):
            raise ValueError(f"Duplicate model labels: {labels}")

        model_specs = list(inference_models)
        self._initial_batch_sizes = initial_batch_sizes or {}

        # Verify the store holds all three logistic fits for every model
        # before any state is built, so misconfiguration surfaces at
        # construction time rather than mid-simulation.
        for ms in model_specs:
            label = ms.model_label
            for metric_name, accessor in [
                ("power", models.power),
                ("latency", models.latency),
                ("throughput", models.throughput),
            ]:
                try:
                    accessor(label)
                except KeyError:
                    raise ValueError(f"LogisticModelStore missing {metric_name} model for {label!r}.") from None

        self._dt_s = dt_s
        self._models = model_specs
        self._config = config
        self._site_id = site_id
        self._itl_deadline_by_model = {ms.model_label: ms.itl_deadline_s for ms in model_specs}

        # Voltage duals are created lazily on the first step() because
        # their dimension depends on the grid's bus-phase index; latency
        # duals (μ_i) start at zero for every model.
        self._voltage_dual: VoltageDualVariables | None = None
        self._latency_dual_by_model: dict[str, float] = {ms.model_label: 0.0 for ms in model_specs}

        # The primal optimizer shares one feasible-batch grid: the
        # sorted union of every model's feasible batch sizes.
        all_bs: set[int] = set()
        for ms in model_specs:
            all_bs.update(ms.feasible_batch_sizes)
        feasible_batch_sizes = sorted(all_bs)

        self._optimizer = PrimalBatchOptimizer(
            models=model_specs,
            feasible_batch_sizes=feasible_batch_sizes,
            power_fits=models.power_fits,
            latency_fits=models.latency_fits,
            throughput_fits=models.throughput_fits,
            config=config,
        )
        self._optimizer.init_from_batches(
            {
                ms.model_label: self._initial_batch_sizes.get(ms.model_label, ms.feasible_batch_sizes[0])
                for ms in model_specs
            }
        )

        # Sensitivity matrix is estimated lazily (and periodically
        # re-estimated) in step().
        self._sensitivity_matrix: np.ndarray | None = None
        self._control_step_count: int = 0

        logger.info(
            "OFOBatchSizeController: %d models, dt=%s s, feasible_batches=%s",
            len(model_specs),
            dt_s,
            feasible_batch_sizes,
        )

    def reset(self) -> None:
        """Restore duals, batch-size state, sensitivity cache, and the
        step counter to their initial values."""
        self._voltage_dual = None
        self._latency_dual_by_model = {ms.model_label: 0.0 for ms in self._models}
        self._optimizer.init_from_batches(
            {
                ms.model_label: self._initial_batch_sizes.get(ms.model_label, ms.feasible_batch_sizes[0])
                for ms in self._models
            }
        )
        self._sensitivity_matrix = None
        self._control_step_count = 0

    @property
    def dt_s(self) -> Fraction:
        """Control interval in seconds."""
        return self._dt_s

    def step(
        self,
        clock: SimulationClock,
        datacenter: LLMBatchSizeControlledDatacenter[LLMDatacenterState],
        grid: OpenDSSGrid,
        events: EventEmitter,
    ) -> list[DatacenterCommand | GridCommand]:
        """Run one OFO iteration and return a `SetBatchSize` command.

        Raises:
            RuntimeError: if the datacenter state lacks replica counts or
                observed ITL for any configured model.
        """
        # Lazily size the voltage duals to the grid's bus-phase index.
        if self._voltage_dual is None:
            self._voltage_dual = VoltageDualVariables(len(grid.v_index), self._config)

        # 1. Re-estimate sensitivity if needed.  Fires on the first step
        #    and then every `sensitivity_update_interval` steps.
        if self._sensitivity_matrix is None or (
            self._config.sensitivity_update_interval > 0
            and self._control_step_count % self._config.sensitivity_update_interval == 0
        ):
            # NOTE(review): site_id is only forwarded when configured —
            # presumably estimate_sensitivity's default covers all sites;
            # confirm against the grid backend.
            sens_kwargs = {"perturbation_kw": self._config.sensitivity_perturbation_kw}
            if self._site_id is not None:
                sens_kwargs["site_id"] = self._site_id
            self._sensitivity_matrix, _ = grid.estimate_sensitivity(**sens_kwargs)

        # 2. Update voltage duals from grid state
        observed_voltages = grid.voltages_vector()
        self._voltage_dual.update(observed_voltages)

        voltage_dual_diff = self._voltage_dual.dual_difference()  # η = λ̄ − λ

        # 3. Read observed latency from datacenter and update latency duals
        dc_state = datacenter.state
        missing_replicas = [
            ms.model_label for ms in self._models if ms.model_label not in dc_state.active_replicas_by_model
        ]
        if missing_replicas:
            miss = ", ".join(sorted(missing_replicas))
            raise RuntimeError(
                f"OFOBatchSizeController requires active_replicas_by_model for all models. Missing: {miss}."
            )
        missing_itl = [ms.model_label for ms in self._models if ms.model_label not in dc_state.observed_itl_s_by_model]
        if missing_itl:
            miss = ", ".join(sorted(missing_itl))
            raise RuntimeError(
                f"OFOBatchSizeController requires observed_itl_s_by_model for all models. Missing: {miss}."
            )
        for ms in self._models:
            label = ms.model_label
            num_replicas = max(int(dc_state.active_replicas_by_model[label]), 0)
            observed_itl = float(dc_state.observed_itl_s_by_model[label])
            if num_replicas <= 0:
                # With no replicas the observed ITL is meaningless; force
                # NaN so the dual is held (not updated) below.
                logger.debug("Model %s has 0 replicas, skipping latency dual update", label)
                observed_itl = float("nan")

            deadline = float(self._itl_deadline_by_model[label])
            if np.isfinite(observed_itl):
                # Projected subgradient ascent on μ_i: grow when ITL
                # exceeds the deadline, shrink otherwise, floor at 0.
                self._latency_dual_by_model[label] = max(
                    self._latency_dual_by_model[label]
                    + self._config.latency_dual_step_size * (observed_itl - deadline),
                    0.0,
                )
            else:
                self._latency_dual_by_model[label] = max(self._latency_dual_by_model[label], 0.0)

        # 4. Compute replica counts
        replica_count_by_model: dict[str, float] = {}
        for ms in self._models:
            label = ms.model_label
            replica_count_by_model[label] = float(dc_state.active_replicas_by_model[label])

        # 5. Primal update -> next batch sizes
        batch_next = self._optimizer.step(
            voltage_dual_diff=voltage_dual_diff,
            sensitivity_matrix=self._sensitivity_matrix,
            phase_share_by_model=datacenter.phase_share_by_model,
            latency_dual_by_model=self._latency_dual_by_model,
            replica_count_by_model=replica_count_by_model,
        )

        self._control_step_count += 1
        logger.info(
            "OFO step %d (t=%.1f s): batch=%s",
            self._control_step_count,
            clock.time_s,
            batch_next,
        )
        events.emit(
            "controller.ofo.step",
            {
                "batch_size_by_model": batch_next,
                "latency_dual_by_model": dict(self._latency_dual_by_model),
            },
        )
        return [SetBatchSize(batch_size_by_model=batch_next, target_site_id=self._site_id)]

openg2g.controller.rule_based

Rule-based batch-size controller for voltage regulation.

A proportional controller that adjusts LLM batch sizes based on observed voltage violations. Unlike the OFO controller, it requires no sensitivity matrix, no logistic curve fits, and no dual variables — making it a natural "simple baseline" for comparison.

Algorithm (each control step):

1. Read all bus-phase voltages from the grid.
2. Find the worst voltage violation magnitude.
3. Compute a signed "pressure" signal:
   - positive (undervoltage) → reduce batch (less power draw, less voltage drop)
   - negative (overvoltage) → increase batch (more power draw, more voltage drop)
   - zero → no action (all voltages within bounds)
4. Adjust each model's batch size proportionally in log2-space.
5. Snap to the nearest feasible batch size.

RuleBasedConfig

Bases: BaseModel

Configuration for the rule-based batch-size controller.

Source code in openg2g/controller/rule_based.py
class RuleBasedConfig(BaseModel):
    """Configuration for the rule-based batch-size controller.

    Knobs: a proportional gain (``step_size``), a voltage band
    (``v_min``/``v_max``), a ``deadband`` to suppress chattering, and a
    ``latency_guard`` toggle.
    """

    step_size: float = 10.0
    """Proportional gain: log2(batch) change per pu of voltage violation.
    With feasible batches spaced ~1 log2 unit apart, a violation of 0.01 pu
    needs step_size ~10 to produce a 0.1 log2 shift, enough to eventually
    change the discrete batch level."""

    v_min: float = 0.95
    """Lower voltage limit (pu)."""

    v_max: float = 1.05
    """Upper voltage limit (pu)."""

    deadband: float = 0.001
    """Ignore violations smaller than this (pu).  Prevents chattering."""

    latency_guard: bool = True
    """If True, prevent batch size increase when ITL exceeds deadline."""

step_size = 10.0 class-attribute instance-attribute

Proportional gain: log2(batch) change per pu of voltage violation. With feasible batches spaced ~1 log2 unit apart, a violation of 0.01 pu needs step_size ~10 to produce a 0.1 log2 shift, enough to eventually change the discrete batch level.

v_min = 0.95 class-attribute instance-attribute

Lower voltage limit (pu).

v_max = 1.05 class-attribute instance-attribute

Upper voltage limit (pu).

deadband = 0.001 class-attribute instance-attribute

Ignore violations smaller than this (pu). Prevents chattering.

latency_guard = True class-attribute instance-attribute

If True, prevent batch size increase when ITL exceeds deadline.

RuleBasedBatchSizeController

Bases: Controller[LLMBatchSizeControlledDatacenter[LLMDatacenterState], OpenDSSGrid]

Proportional rule-based controller for LLM batch-size regulation.

Reads grid voltages, computes a signed pressure signal from the worst violation, and adjusts batch sizes proportionally. No model fits or sensitivity matrices required.

Source code in openg2g/controller/rule_based.py
class RuleBasedBatchSizeController(
    Controller[LLMBatchSizeControlledDatacenter[LLMDatacenterState], OpenDSSGrid],
):
    """Proportional rule-based controller for LLM batch-size regulation.

    Reads grid voltages, computes a signed pressure signal from the worst
    violation, and adjusts batch sizes proportionally.  No model fits or
    sensitivity matrices required.

    Args:
        inference_models: Model specifications served in the datacenter.
        config: Proportional-controller tuning parameters.
        dt_s: Control interval (seconds).
        site_id: Optional site targeted by emitted batch-size commands.
        exclude_buses: Bus names (case-insensitive) ignored when scanning
            voltages for violations.
        initial_batch_sizes: Optional starting batch size per model label;
            models not listed start at their first declared feasible batch.
    """

    def __init__(
        self,
        inference_models: tuple[InferenceModelSpec, ...] | list[InferenceModelSpec],
        *,
        config: RuleBasedConfig,
        dt_s: Fraction = Fraction(1),
        site_id: str | None = None,
        exclude_buses: tuple[str, ...] = (),
        initial_batch_sizes: dict[str, int] | None = None,
    ) -> None:
        model_specs = list(inference_models)
        self._dt_s = dt_s
        self._site_id = site_id
        self._config = config
        self._models = model_specs
        # Compare bus names case-insensitively when excluding.
        self._exclude_lower = {b.lower() for b in exclude_buses}
        self._initial_batch_sizes = initial_batch_sizes or {}

        # Build per-model feasible batch list (sorted ascending)
        self._feasible: dict[str, list[int]] = {}
        self._itl_deadline: dict[str, float] = {}
        for ms in model_specs:
            self._feasible[ms.model_label] = sorted(ms.feasible_batch_sizes)
            self._itl_deadline[ms.model_label] = ms.itl_deadline_s

        # Continuous state: log2(batch) per model (for smooth proportional control)
        self._log2_batch: dict[str, float] = {
            ms.model_label: math.log2(self._initial_batch_sizes.get(ms.model_label, ms.feasible_batch_sizes[0]))
            for ms in model_specs
        }

        logger.info(
            "RuleBasedBatchSizeController: %d models, dt=%s s, step_size=%.2f, deadband=%.4f, v=[%.2f, %.2f]",
            len(model_specs),
            dt_s,
            config.step_size,
            config.deadband,
            config.v_min,
            config.v_max,
        )

    @property
    def site_id(self) -> str | None:
        """Site this controller targets, or None for the default."""
        return self._site_id

    @property
    def dt_s(self) -> Fraction:
        """Control interval in seconds."""
        return self._dt_s

    def reset(self) -> None:
        """Restore the continuous log2-batch state to the initial batches."""
        self._log2_batch = {
            ms.model_label: math.log2(self._initial_batch_sizes.get(ms.model_label, ms.feasible_batch_sizes[0]))
            for ms in self._models
        }

    def step(
        self,
        clock: SimulationClock,
        datacenter: LLMBatchSizeControlledDatacenter[LLMDatacenterState],
        grid: OpenDSSGrid,
        events: EventEmitter,
    ) -> list[DatacenterCommand | GridCommand]:
        """Run one proportional step; emit `SetBatchSize` when batches change."""
        if grid.state is None:
            return []

        cfg = self._config
        voltages = grid.state.voltages

        # ── 1. Find worst voltage violation ──
        worst_under = 0.0  # magnitude of worst undervoltage (positive)
        worst_over = 0.0  # magnitude of worst overvoltage (positive)

        for bus in voltages.buses():
            if bus.lower() in self._exclude_lower:
                continue
            pv = voltages[bus]
            for v in (pv.a, pv.b, pv.c):
                if math.isnan(v):  # absent/unmonitored phase
                    continue
                if v < cfg.v_min:
                    worst_under = max(worst_under, cfg.v_min - v)
                elif v > cfg.v_max:
                    worst_over = max(worst_over, v - cfg.v_max)

        # ── 2. Compute pressure signal ──
        # Positive pressure → reduce batch (undervoltage: DC draws too much power)
        # Negative pressure → increase batch (overvoltage: DC draws too little)
        if worst_under > cfg.deadband:
            pressure = worst_under
        elif worst_over > cfg.deadband:
            pressure = -worst_over
        else:
            pressure = 0.0

        if pressure == 0.0:
            return []

        # ── 3. Read latency state for guard ──
        dc_state = datacenter.state
        itl_by_model = dc_state.observed_itl_s_by_model if dc_state else {}

        # ── 4. Adjust batch sizes ──
        new_batches: dict[str, int] = {}
        changed = False

        for ms in self._models:
            label = ms.model_label
            log2_b = self._log2_batch[label]
            feasible = self._feasible[label]

            # Proportional adjustment in log2-space
            # pressure > 0 (undervoltage) → reduce batch → log2_b decreases
            delta = -cfg.step_size * pressure
            new_log2 = log2_b + delta

            # Clamp to feasible range
            new_log2 = max(math.log2(feasible[0]), min(math.log2(feasible[-1]), new_log2))

            # Latency guard: don't increase batch if ITL already exceeds deadline
            if cfg.latency_guard and delta > 0:
                itl = itl_by_model.get(label, 0.0)
                if not math.isnan(itl) and itl > self._itl_deadline[label]:
                    new_log2 = log2_b  # revert

            # Snap to nearest feasible batch size
            target = 2.0**new_log2
            best = min(feasible, key=lambda b: abs(b - target))

            # Keep continuous state for accumulation; only snap for the command
            self._log2_batch[label] = new_log2
            new_batches[label] = best

            # BUGFIX: dc_state may be None (already handled above for the
            # latency guard) — guard the dereference here too instead of
            # raising AttributeError.
            fallback = self._initial_batch_sizes.get(label, ms.feasible_batch_sizes[0])
            current = dc_state.batch_size_by_model.get(label, fallback) if dc_state else fallback
            if best != current:
                changed = True

        if not changed:
            return []

        events.emit(
            "rule_based.step",
            {"time_s": clock.time_s, "pressure": pressure, "batch": dict(new_batches)},
        )

        # Forward the configured site, consistent with OFOBatchSizeController.
        return [SetBatchSize(batch_size_by_model=new_batches, target_site_id=self._site_id)]

openg2g.controller.tap_schedule

Tap schedule controller: applies pre-defined regulator tap changes at specified times.

TapScheduleController

Bases: Controller[DatacenterBackend, GridBackend]

Applies pre-defined tap changes at scheduled times.

When multiple schedule entries fire in the same step, their tap values are merged (later entries win).

Parameters:

Name Type Description Default
schedule TapSchedule

Tap schedule built via TapPosition(...).at(t=...) | ....

required
dt_s Fraction

How often the controller checks the schedule (seconds).

Fraction(1)
Source code in openg2g/controller/tap_schedule.py
class TapScheduleController(Controller[DatacenterBackend, GridBackend]):
    """Replays a pre-defined regulator tap schedule.

    Entries whose timestamps have been reached are consumed in order;
    when several fire within one step, their tap values are merged with
    later entries taking precedence.

    Args:
        schedule: Tap schedule built via
            [`TapPosition(...).at(t=...) | ...`][openg2g.grid.config.TapSchedule].
        dt_s: How often the controller checks the schedule (seconds).
    """

    def __init__(self, *, schedule: TapSchedule, dt_s: Fraction = Fraction(1)) -> None:
        self._dt_s = dt_s
        self._pending = list(schedule)
        self._cursor = 0

    def reset(self) -> None:
        """Rewind to the start of the schedule."""
        self._cursor = 0

    @property
    def dt_s(self) -> Fraction:
        """Control interval in seconds."""
        return self._dt_s

    def step(
        self,
        clock: SimulationClock,
        datacenter: DatacenterBackend,
        grid: GridBackend,
        events: EventEmitter,
    ) -> list[DatacenterCommand | GridCommand]:
        """Emit one merged ``SetTaps`` command for all entries now due."""
        now = clock.time_s
        due_taps: dict[str, float] = {}
        fired = False

        # Consume every entry whose time has arrived; the small epsilon
        # absorbs float round-off in the clock comparison.
        while self._cursor < len(self._pending):
            t_entry, position = self._pending[self._cursor]
            if float(t_entry) > now + 1e-12:
                break
            due_taps.update(position.regulators)
            fired = True
            self._cursor += 1

        if not (fired and due_taps):
            return []

        tap = TapPosition(regulators=due_taps)
        events.emit("controller.tap_schedule.fired", {"tap_position": tap})
        return [SetTaps(tap_position=tap)]