Skip to content

Collection

MetricCollection

Bases: Metric, Generic[T]

A metric that aggregates multiple sub-metrics.

Parameters:

Name Type Description Default
metrics dict[str, T] | None

A dictionary mapping metric names to Metric instances.

None
Source code in src/kibad_llm/metrics/collection.py
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
class MetricCollection(Metric, Generic[T]):
    """A metric that aggregates multiple sub-metrics.

    Args:
        metrics: A dictionary mapping metric names to Metric instances.
    """

    def __init__(self, metrics: dict[str, T] | None = None, sort_fields: bool = False) -> None:
        super().__init__()
        self.metrics: dict[str, T] = metrics or dict()
        self.sort_fields = sort_fields

    def add_metric(self, name: str, metric: T) -> None:
        """Adds a new metric to the collection."""
        if name in self.metrics:
            raise ValueError(f"Metric {name} already exists")
        self.metrics[name] = metric

    def reset(self) -> None:
        """Resets all sub-metrics."""
        for metric in self.metrics.values():
            metric.reset()

    def _update(self, prediction: Any, reference: Any, record_id: Hashable | None = None) -> None:
        """Updates all sub-metrics with the given data."""
        for metric in self.metrics.values():
            metric.update(prediction=prediction, reference=reference, record_id=record_id)

    def _compute(self, *args, **kwargs) -> dict[str, Any]:
        """Computes and returns the results of all sub-metrics.

        Returns:
            A dictionary mapping metric names to their computed results.
        """
        results = {}
        names = list(self.metrics.keys())
        if self.sort_fields:
            names = sorted(names)
        for name in names:
            results[name] = self.metrics[name].compute(*args, reset=False, **kwargs)
        return results

add_metric(name, metric)

Adds a new metric to the collection.

Source code in src/kibad_llm/metrics/collection.py
21
22
23
24
25
def add_metric(self, name: str, metric: T) -> None:
    """Adds a new metric to the collection."""
    if name in self.metrics:
        raise ValueError(f"Metric {name} already exists")
    self.metrics[name] = metric

reset()

Resets all sub-metrics.

Source code in src/kibad_llm/metrics/collection.py
27
28
29
30
def reset(self) -> None:
    """Resets all sub-metrics."""
    for metric in self.metrics.values():
        metric.reset()