metrics

`optimus_dl.modules.metrics.metrics` ¶

`AccuracyMetric` ¶

Bases: Metric

Computes Top-1 accuracy for classification tasks.

Source code in optimus_dl/modules/metrics/metrics.py

@register_metric("accuracy", AccuracyMetricConfig)
class AccuracyMetric(Metric):
    """Top-1 accuracy for classification tasks.

    Emits two sub-metrics per batch: "accuracy" (weighted by the number of
    counted elements) and "total" (the number of counted elements).
    """

    @property
    def requires(self) -> set[str]:
        """Protocols this metric needs: only the classification protocol."""
        return {StandardProtocols.CLASSIFICATION}

    @property
    def accumulators(self) -> dict[str, str]:
        """Average "accuracy" across batches and sum "total"."""
        return {"accuracy": "average", "total": "sum"}

    def __call__(
        self, sources_data: dict[str, dict[str, Any]]
    ) -> dict[str, dict[str, Any]]:
        """Compute the fraction of predictions equal to their targets.

        Args:
            sources_data: Protocol string -> data. The classification entry
                must provide "predictions" and "targets" and may provide a
                "mask" selecting which positions count.

        Returns:
            Log kwargs for "accuracy" and "total", or an empty dict when the
            classification entry is missing/empty or nothing is counted.
        """
        payload = sources_data.get(StandardProtocols.CLASSIFICATION)
        if not payload:
            return {}

        predicted = payload["predictions"]
        expected = payload["targets"]
        valid = payload.get("mask")

        hits = predicted == expected
        if valid is None:
            # No mask supplied: every target position counts.
            counted = expected.numel()
        else:
            # Only positions selected by the mask may count as hits.
            hits = hits & valid
            counted = valid.sum().item()

        # Nothing to score; emitting a value here would divide by zero.
        if counted == 0:
            return {}

        accuracy = hits.sum().item() / counted
        return {
            "accuracy": {"value": accuracy, "weight": counted},
            "total": {"value": counted},
        }

`AccuracyMetricConfig` `dataclass` ¶

Bases: MetricConfig

AccuracyMetricConfig(_name: 'str' = 'accuracy', nested_name: 'str | None' = None)

Source code in optimus_dl/modules/metrics/metrics.py

@dataclass
class AccuracyMetricConfig(MetricConfig):
    """Configuration for `AccuracyMetric`."""

    # Same string that `AccuracyMetric` is registered under via `register_metric`.
    _name: str = "accuracy"

`LossMetric` ¶

Bases: Metric

Simple wrapper to report loss via MetricEngine.

Source code in optimus_dl/modules/metrics/metrics.py

@register_metric("loss", LossMetricConfig)
class LossMetric(Metric):
    """Simple wrapper to report loss via MetricEngine.

    Emits a single "loss" sub-metric aggregated with the "average"
    accumulator. When classification data carrying a mask is also present,
    the mask's sum is used as the averaging weight; otherwise the weight
    is 1.0.
    """

    @property
    def requires(self) -> set[str]:
        """Protocols this metric needs: only the loss protocol."""
        return {StandardProtocols.LOSS}

    @property
    def accumulators(self) -> dict[str, str]:
        """Aggregate the "loss" sub-metric with the "average" accumulator."""
        return {"loss": "average"}

    def __call__(
        self, sources_data: dict[str, dict[str, Any]]
    ) -> dict[str, dict[str, Any]]:
        """Build the log kwargs for the batch loss.

        Args:
            sources_data: Protocol string -> data. The loss entry is used
                directly as the loss value: objects exposing `.item()` are
                converted through it, anything else is passed along as-is.

        Returns:
            `{"loss": {"value": ..., "weight": ...}}`, or an empty dict when
            no loss entry is available.
        """
        loss = sources_data.get(StandardProtocols.LOSS)
        if loss is None:
            return {}

        weight = 1.0
        classif = sources_data.get(StandardProtocols.CLASSIFICATION)
        # A mask key that is present but set to None means "no mask", exactly
        # as AccuracyMetric interprets it; calling .sum() on it would raise.
        mask = classif.get("mask") if classif else None
        if mask is not None:
            weight = mask.sum().item()

        return {
            "loss": {
                "value": loss.item() if hasattr(loss, "item") else loss,
                "weight": weight,
            }
        }

`LossMetricConfig` `dataclass` ¶

Bases: MetricConfig

LossMetricConfig(_name: 'str' = 'loss', nested_name: 'str | None' = None)

Source code in optimus_dl/modules/metrics/metrics.py

@dataclass
class LossMetricConfig(MetricConfig):
    """Configuration for `LossMetric`."""

    # Same string that `LossMetric` is registered under via `register_metric`.
    _name: str = "loss"

`Metric` ¶

Bases: ABC

Stateless definition for computing metrics from model/source data.

A Metric implementation defines: (1) what data it requires, via `requires` (a set of protocol strings); (2) how to calculate raw results for a batch, potentially emitting multiple sub-values; and (3) how to finalize those values after they've been aggregated (e.g., F1 from counts).

Source code in optimus_dl/modules/metrics/metrics.py

class Metric(ABC):
    """Stateless recipe for turning model/source data into metric values.

    A concrete metric declares:
    - `requires`: the set of protocol strings whose data it needs.
    - `__call__`: the per-batch computation, which may emit several sub-values.
    - `finalize`: an optional step applied after aggregation (e.g., F1 from counts).
    """

    def __init__(self, cfg: MetricConfig):
        self.cfg = cfg
        # Mirrored onto the instance so it can be read without going through cfg.
        self.nested_name = self.cfg.nested_name

    @property
    @abstractmethod
    def requires(self) -> set[str]:
        """Set of protocol strings this metric requires."""
        raise NotImplementedError

    @property
    def accumulators(self) -> dict[str, str]:
        """Describe how each sub-metric is aggregated across batches.

        Returns a mapping from sub-metric names to accumulator types
        (e.g., 'average', 'sum', 'gather', 'perplexity'). By default a single
        sub-metric named after the config's `_name` is averaged.
        """
        metric_name = self.cfg._name
        return {metric_name: "average"}

    @abstractmethod
    def __call__(
        self, sources_data: dict[str, dict[str, Any]]
    ) -> dict[str, dict[str, Any]]:
        """Compute raw metric values for the batch.

        Args:
            sources_data: Protocol string -> data.

        Returns:
            Dict mapping sub-metric names to log kwargs
            (e.g., {'value': ..., 'weight': ...}) for accumulators.
        """
        raise NotImplementedError

    def finalize(self, aggregated_data: dict[str, Any]) -> dict[str, Any]:
        """Turn aggregated values into the metrics that get reported.

        Args:
            aggregated_data: Dict mapping sub-metric names to their
                computed/aggregated values from accumulators.

        Returns:
            Dict of final metrics to be logged/reported; entries whose name
            starts with an underscore are dropped.
        """
        reported: dict[str, Any] = {}
        for name, value in aggregated_data.items():
            # Underscore-prefixed sub-metrics are intermediate values only.
            if name.startswith("_"):
                continue
            reported[name] = value
        return reported

`accumulators` `property` ¶

Define how each sub-metric should be aggregated across batches.

Returns a mapping from sub-metric names to accumulator types (e.g., 'average', 'sum', 'gather', 'perplexity').

`requires` `abstractmethod` `property` ¶

Set of protocol strings that this metric requires.

`__call__(sources_data)` `abstractmethod` ¶

Compute raw metric values for the batch.

Parameters:

Name	Type	Description	Default
`batch`		The original batch dictionary.	required
`sources_data`	`dict[str, dict[str, Any]]`	Protocol string -> data.	required

Returns:

Type	Description
`dict[str, dict[str, Any]]`	Dict mapping sub-metric names to log kwargs (e.g., {'value': ..., 'weight': ...}) for accumulators.

Source code in optimus_dl/modules/metrics/metrics.py

@abstractmethod
def __call__(
    self, sources_data: dict[str, dict[str, Any]]
) -> dict[str, dict[str, Any]]:
    """Compute raw metric values for the batch.

    Abstract: this base implementation only raises, so concrete metrics
    must override it.

    Args:
        sources_data: Protocol string -> data.

    Returns:
        Dict mapping sub-metric names to log kwargs (e.g., {'value': ..., 'weight': ...})
        for accumulators.

    Raises:
        NotImplementedError: Always, when the base implementation is invoked.
    """
    raise NotImplementedError

`finalize(aggregated_data)` ¶

Perform final calculations on aggregated data.

Parameters:

Name	Type	Description	Default
`aggregated_data`	`dict[str, Any]`	Dict mapping sub-metric names to their computed/aggregated values from accumulators.	required

Returns:

Type	Description
`dict[str, Any]`	Dict of final metrics to be logged/reported.

Source code in optimus_dl/modules/metrics/metrics.py

def finalize(self, aggregated_data: dict[str, Any]) -> dict[str, Any]:
    """Turn aggregated values into the metrics that get reported.

    Args:
        aggregated_data: Dict mapping sub-metric names to their
            computed/aggregated values from accumulators.

    Returns:
        Dict of final metrics to be logged/reported; entries whose name
        starts with an underscore are dropped.
    """
    reported: dict[str, Any] = {}
    for name, value in aggregated_data.items():
        # Underscore-prefixed sub-metrics are intermediate values only.
        if name.startswith("_"):
            continue
        reported[name] = value
    return reported

`MetricConfig` `dataclass` ¶

Bases: RegistryConfigStrict

MetricConfig(_name: str | None = None, nested_name: 'str | None' = None)

Parameters:

Name	Type	Description	Default
`nested_name`	`str \| None`	Optional name to nest this metric under in the metrics tree.	`None`

Source code in optimus_dl/modules/metrics/metrics.py

@dataclass
class MetricConfig(RegistryConfigStrict):
    """Base configuration shared by the metric configs in this module."""

    # Optional grouping key; `Metric.__init__` copies it onto the metric instance.
    nested_name: str | None = field(
        default=None,
        metadata={
            "description": "Optional name to nest this metric under in the metrics tree."
        },
    )

`PerplexityMetric` ¶

Bases: Metric

Computes perplexity (exp(loss)).

Source code in optimus_dl/modules/metrics/metrics.py

@register_metric("perplexity", PerplexityMetricConfig)
class PerplexityMetric(Metric):
    """Computes perplexity (exp(loss)).

    This class only forwards the raw loss under the "perplexity" accumulator
    type; the exponentiation is presumably performed by that accumulator
    (not visible here — confirm against the accumulator implementation).
    When classification data carrying a mask is also present, the mask's sum
    is used as the weight; otherwise the weight is 1.0.
    """

    @property
    def requires(self) -> set[str]:
        """Protocols this metric needs: only the loss protocol."""
        return {StandardProtocols.LOSS}

    @property
    def accumulators(self) -> dict[str, str]:
        """Aggregate the "perplexity" sub-metric with the "perplexity" accumulator."""
        return {"perplexity": "perplexity"}

    def __call__(
        self, sources_data: dict[str, dict[str, Any]]
    ) -> dict[str, dict[str, Any]]:
        """Build the log kwargs that feed the perplexity accumulator.

        Args:
            sources_data: Protocol string -> data. The loss entry is used
                directly as the loss value: objects exposing `.item()` are
                converted through it, anything else is passed along as-is.

        Returns:
            `{"perplexity": {"value": <loss>, "weight": ...}}`, or an empty
            dict when no loss entry is available.
        """
        loss = sources_data.get(StandardProtocols.LOSS)
        if loss is None:
            return {}

        weight = 1.0
        classif = sources_data.get(StandardProtocols.CLASSIFICATION)
        # A mask key that is present but set to None means "no mask", exactly
        # as AccuracyMetric interprets it; calling .sum() on it would raise.
        mask = classif.get("mask") if classif else None
        if mask is not None:
            weight = mask.sum().item()

        return {
            "perplexity": {
                "value": loss.item() if hasattr(loss, "item") else loss,
                "weight": weight,
            }
        }

`PerplexityMetricConfig` `dataclass` ¶

Bases: MetricConfig

PerplexityMetricConfig(_name: 'str' = 'perplexity', nested_name: 'str | None' = None)

Source code in optimus_dl/modules/metrics/metrics.py

@dataclass
class PerplexityMetricConfig(MetricConfig):
    """Configuration for `PerplexityMetric`."""

    # Same string that `PerplexityMetric` is registered under via `register_metric`.
    _name: str = "perplexity"

metrics

optimus_dl.modules.metrics.metrics ¶

AccuracyMetric ¶

AccuracyMetricConfig dataclass ¶

LossMetric ¶

LossMetricConfig dataclass ¶

Metric ¶

accumulators property ¶

requires abstractmethod property ¶

__call__(sources_data) abstractmethod ¶

finalize(aggregated_data) ¶

MetricConfig dataclass ¶

PerplexityMetric ¶

PerplexityMetricConfig dataclass ¶

`optimus_dl.modules.metrics.metrics` ¶

`AccuracyMetric` ¶

`AccuracyMetricConfig` `dataclass` ¶

`LossMetric` ¶

`LossMetricConfig` `dataclass` ¶

`Metric` ¶

`accumulators` `property` ¶

`requires` `abstractmethod` `property` ¶

`__call__(sources_data)` `abstractmethod` ¶

`finalize(aggregated_data)` ¶

`MetricConfig` `dataclass` ¶

`PerplexityMetric` ¶

`PerplexityMetricConfig` `dataclass` ¶