Source code for eclypse.policies.replay.replay_nodes

"""Replay node attributes from records."""

from __future__ import annotations

from dataclasses import dataclass
from typing import (
    TYPE_CHECKING,
    Any,
)

from eclypse.policies._helpers import validate_missing_behaviour
from eclypse.policies.replay._helpers import (
    group_records_by_step,
    infer_value_columns,
    initial_step,
    normalise_records,
    resolve_replay_step,
)

if TYPE_CHECKING:
    from eclypse.graph.asset_graph import AssetGraph
    from eclypse.policies._filters import NodeFilter
    from eclypse.utils.types import (
        MissingPolicyBehaviour,
        UpdatePolicy,
    )


@dataclass(slots=True)
class ReplayNodesPolicy:
    """Replay node attributes from time-indexed records."""

    records_by_step: dict[int, list[dict[str, Any]]]
    columns: list[str]
    node_id_column: str = "node_id"
    selected_node_ids: set[str] | None = None
    node_filter: NodeFilter | None = None
    missing: MissingPolicyBehaviour = "ignore"
    cyclic: bool = False
    current_step: int = 0

    def __call__(self, graph: AssetGraph):
        """Apply the replay records for the current step to matching nodes."""
        replay_step = resolve_replay_step(
            self.records_by_step,
            self.current_step,
            cyclic=self.cyclic,
        )
        for record in self.records_by_step.get(replay_step, []):
            _update_node_from_record(
                graph,
                record,
                columns=self.columns,
                node_id_column=self.node_id_column,
                selected_node_ids=self.selected_node_ids,
                node_filter=self.node_filter,
                missing=self.missing,
            )

        graph.logger.trace(f"Applied replay_nodes policy for step {replay_step}.")
        self.current_step += 1


[docs] def replay_nodes( record_source, *, node_id_column: str = "node_id", time_column: str = "time", value_columns: list[str] | tuple[str, ...] | None = None, node_ids: list[str] | None = None, node_filter: NodeFilter | None = None, missing: MissingPolicyBehaviour = "ignore", start_step: int | None = None, cyclic: bool = False, ) -> UpdatePolicy: """Replay node attributes from time-indexed records. Args: record_source (Any): Iterable of mapping records to replay. node_id_column (str): Column containing node identifiers. time_column (str): Column containing replay steps. value_columns (list[str] | tuple[str, ...] | None): Optional explicit columns to copy from records. node_ids (list[str] | None): Optional explicit node identifiers to mutate. node_filter (NodeFilter | None): Optional predicate receiving ``(node_id, data)``. missing (MissingPolicyBehaviour): Behaviour when a replay record targets a missing node. start_step (int | None): Optional starting replay step. cyclic (bool): Whether to wrap past the final available replay step. Returns: Stateful node replay policy. """ validate_missing_behaviour(missing) records = normalise_records(record_source) columns = infer_value_columns( records, reserved_columns=[node_id_column, time_column], value_columns=value_columns, ) records_by_step = group_records_by_step(records, time_column=time_column) selected_node_ids = set(node_ids) if node_ids is not None else None current_step = initial_step(records_by_step, start_step) return ReplayNodesPolicy( records_by_step=records_by_step, columns=columns, node_id_column=node_id_column, selected_node_ids=selected_node_ids, node_filter=node_filter, missing=missing, cyclic=cyclic, current_step=current_step, )
def _update_node_from_record( graph: AssetGraph, record, *, columns: list[str], node_id_column: str, selected_node_ids: set[str] | None, node_filter, missing: MissingPolicyBehaviour, ): node_id = record[node_id_column] if selected_node_ids is not None and node_id not in selected_node_ids: return if not graph.has_node(node_id): if missing == "error": raise KeyError(f'Node "{node_id}" not found in the graph.') return data = graph.nodes[node_id] if node_filter is not None and not node_filter(node_id, data): return for column in columns: if column in record: data[column] = record[column]