Source code for brainscore_core.metrics

"""
A :class:`~brainscore_core.metrics.Metric` is part of a :class:`~brainscore_core.benchmarks.Benchmark`
and scores how similar two sets of data are.
Typically these two sets are model and primate measurements, but metrics are agnostic of the data source
and can also be used to compare two primate measurements (e.g. for ceiling estimates).
"""

import logging
import warnings

from brainio.assemblies import DataAssembly, merge_data_arrays

_logger = logging.getLogger(__name__)


class Score(DataAssembly):
    """
    Scores are used as the outputs of metrics, benchmarks, and ceilings.
    They indicate similarity or goodness-of-fit of sets of data.
    The high-level score is typically an aggregate of many smaller scores, e.g. the median of neuroid correlations.
    To keep records of these smaller scores, a score can store "raw" scores in its attributes
    (`score.attrs['raw']`).
    """

    RAW_VALUES_KEY = 'raw'
    def sel(self, *args, _apply_raw=True, **kwargs):
        return self._preserve_raw('sel', *args, **kwargs, _apply_raw=_apply_raw)

    def isel(self, *args, _apply_raw=True, **kwargs):
        return self._preserve_raw('isel', *args, **kwargs, _apply_raw=_apply_raw)

    def squeeze(self, *args, _apply_raw=True, **kwargs):
        return self._preserve_raw('squeeze', *args, **kwargs, _apply_raw=_apply_raw)

    def expand_dims(self, *args, _apply_raw=True, **kwargs):
        return self._preserve_raw('expand_dims', *args, **kwargs, _apply_raw=_apply_raw)

    def mean(self, *args, _apply_raw=False, **kwargs):
        return self._preserve_raw('mean', *args, **kwargs, _apply_raw=_apply_raw)

    def sum(self, *args, _apply_raw=False, **kwargs):
        return self._preserve_raw('sum', *args, **kwargs, _apply_raw=_apply_raw)

    def std(self, *args, _apply_raw=False, **kwargs):
        return self._preserve_raw('std', *args, **kwargs, _apply_raw=_apply_raw)

    def min(self, *args, _apply_raw=False, **kwargs):
        return self._preserve_raw('min', *args, **kwargs, _apply_raw=_apply_raw)
    def reduce(self, *args, _apply_raw=False, **kwargs):
        return self._preserve_raw('reduce', *args, **kwargs, _apply_raw=_apply_raw)

    def _preserve_raw(self, func, *args, _apply_raw=False, _ignore_errors=True, **kwargs):
        result = getattr(super(Score, self), func)(*args, **kwargs)
        for attr_key, attr_value in self.attrs.items():
            if self.RAW_VALUES_KEY in attr_key:
                if _apply_raw:
                    try:
                        attr_value = getattr(attr_value, func)(*args, **kwargs)
                    except Exception as e:
                        if _ignore_errors:
                            # ignore errors with warning. most users will likely only want to access the main score
                            _logger.debug(f"{func} on raw values failed: {repr(e)}")
                        else:
                            raise e
                result.attrs[attr_key] = attr_value
        return result

    def __setitem__(self, key, value, _apply_raw=True):
        super(Score, self).__setitem__(key, value)
        if _apply_raw:
            for attr_key in self.attrs:
                if self.RAW_VALUES_KEY in attr_key:
                    try:
                        self.attrs[attr_key].__setitem__(key, value)
                    except Exception as e:
                        _logger.debug(f"failed to set {key}={value} on raw values: " + repr(e))
    @classmethod
    def merge(cls, *scores, exception_handling: str = 'ignore'):
        """
        Merges the raw values in addition to the score assemblies.
        Raw values are indexed on the first score.

        :param exception_handling: how to deal with raised exceptions, one of
            'ignore' (do not raise or log), 'warn' (log but do not raise), 'raise' (raise exception).
        """
        result = merge_data_arrays(scores)
        for attr_key in scores[0].attrs:
            if cls.RAW_VALUES_KEY in attr_key:
                attr_values = [score.attrs[attr_key] for score in scores]
                try:
                    attr_values = Score.merge(*attr_values, exception_handling=exception_handling)
                    result.attrs[attr_key] = attr_values
                except Exception as e:
                    if exception_handling == 'ignore':
                        pass
                    elif exception_handling == 'warn':
                        warnings.warn("failed to merge raw values: " + str(e))
                    elif exception_handling == 'raise':
                        raise e
                    else:
                        raise ValueError(f"Unknown exception_handling argument '{exception_handling}'")
        return result
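
The following sketch (not part of the module) illustrates the typical raw-value pattern under assumed data: the coordinate names `split` and `neuroid` and all values are made up for this example. Aggregating over splits and storing the per-split scores under `attrs['raw']` lets later indexing operations carry the raw values along, while further aggregations leave them untouched.

    # illustrative usage sketch; 'split'/'neuroid' coordinates and values are hypothetical
    raw = Score([[0.40, 0.45], [0.38, 0.42]],
                coords={'split': [0, 1], 'neuroid': ['n1', 'n2']},
                dims=['split', 'neuroid'])
    per_neuroid = raw.mean('split')                # aggregate over splits: one value per neuroid
    per_neuroid.attrs[Score.RAW_VALUES_KEY] = raw  # keep the per-split scores as "raw" values
    aggregate = per_neuroid.mean('neuroid')        # mean/sum/std/min leave attrs['raw'] unchanged (_apply_raw=False)
    subset = per_neuroid.sel(neuroid='n1')         # sel/isel/squeeze/expand_dims are also applied to attrs['raw']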
class Metric:
    """
    Metric interface.
    A metric compares two sets of data and outputs a score of how well they match
    (1 = identical, 0 = no match).
    """
    def __call__(self, assembly1: DataAssembly, assembly2: DataAssembly) -> Score:
        """
        Compare two assemblies on their similarity.
        These assemblies are typically neural or behavioral measurements, e.g. model and primate recordings.

        :param assembly1: the first assembly to compare against the second
        :param assembly2: the second assembly to compare against the first
        :return: a :class:`~brainscore_core.metrics.Score` denoting the match between the two assemblies
            (1 = identical, 0 = no match).
        """
        raise NotImplementedError()
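
As a minimal sketch of how a concrete metric might implement this interface, consider a hypothetical correlation-based metric (the class name `PearsonCorrelationMetric` and its scoring rule are illustrative assumptions, not part of this module):

    # illustrative sketch of a Metric subclass; not part of brainscore_core.metrics
    import numpy as np


    class PearsonCorrelationMetric(Metric):
        def __call__(self, assembly1: DataAssembly, assembly2: DataAssembly) -> Score:
            # assumes both assemblies have the same shape and aligned coordinates;
            # a real metric would typically align and validate them first
            r = np.corrcoef(np.asarray(assembly1).flatten(),
                            np.asarray(assembly2).flatten())[0, 1]
            # note: Pearson r can be negative; a production metric might clip or rescale
            # to stay within the documented 0 (no match) to 1 (identical) range
            return Score(r)


    # example usage with tiny made-up assemblies
    a = DataAssembly([1.0, 2.0, 3.0], coords={'presentation': [0, 1, 2]}, dims=['presentation'])
    b = DataAssembly([1.1, 1.9, 3.2], coords={'presentation': [0, 1, 2]}, dims=['presentation'])
    score = PearsonCorrelationMetric()(a, b)  # close to 1 for well-matched data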