Source code for bob.measure

# import Libraries of other lib packages
import bob.math
import bob.io.base

from ._library import *
from . import version
from .version import module as __version__

from . import plot
from . import calibration
from . import load
import numpy


[docs]def fprfnr(negatives, positives, threshold): """Alias for :py:func:`bob.measure.farfrr`""" return farfrr(negatives, positives, threshold)
[docs]def mse (estimation, target): """Mean square error between a set of outputs and target values Uses the formula: .. math:: MSE(\hat{\Theta}) = E[(\hat{\Theta} - \Theta)^2] Estimation (:math:`\hat{\Theta}`) and target (:math:`\Theta`) are supposed to have 2 dimensions. Different examples are organized as rows while different features in the estimated values or targets are organized as different columns. Parameters: estimation (array): an N-dimensional array that corresponds to the value estimated by your procedure target (array): an N-dimensional array that corresponds to the expected value Returns: float: The average of the squared error between the estimated value and the target """ return numpy.mean((estimation - target)**2, 0)
[docs]def rmse (estimation, target): """Calculates the root mean square error between a set of outputs and target Uses the formula: .. math:: RMSE(\hat{\Theta}) = \sqrt(E[(\hat{\Theta} - \Theta)^2]) Estimation (:math:`\hat{\Theta}`) and target (:math:`\Theta`) are supposed to have 2 dimensions. Different examples are organized as rows while different features in the estimated values or targets are organized as different columns. Parameters: estimation (array): an N-dimensional array that corresponds to the value estimated by your procedure target (array): an N-dimensional array that corresponds to the expected value Returns: float: The square-root of the average of the squared error between the estimated value and the target """ return numpy.sqrt(mse(estimation, target))
[docs]def relevance (input, machine): """Calculates the relevance of every input feature to the estimation process Uses the formula: Neural Triggering System Operating on High Resolution Calorimetry Information, Anjos et al, April 2006, Nuclear Instruments and Methods in Physics Research, volume 559, pages 134-138 .. math:: R(x_{i}) = |E[(o(x) - o(x|x_{i}=E[x_{i}]))^2]| In other words, the relevance of a certain input feature **i** is the change on the machine output value when such feature is replaced by its mean for all input vectors. For this to work, the `input` parameter has to be a 2D array with features arranged column-wise while different examples are arranged row-wise. Parameters: input (array): an N-dimensional array that corresponds to the value estimated by your model machine (object): A machine that can be called to "process" your input Returns: array: An 1D float array as large as the number of columns (second dimension) of your input array, estimating the "relevance" of each input column (or feature) to the score provided by the machine. """ o = machine(input) i2 = input.copy() retval = numpy.ndarray((input.shape[1],), 'float64') retval.fill(0) for k in range(input.shape[1]): i2[:,:] = input #reset i2[:,k] = numpy.mean(input[:,k]) retval[k] = (mse(machine(i2), o).sum())**0.5 return retval
[docs]def recognition_rate(cmc_scores, threshold = None, rank = 1): """Calculates the recognition rate from the given input It is identical to the CMC value for the given ``rank``. The input has a specific format, which is a list of two-element tuples. Each of the tuples contains the negative :math:`\\{S_p^-\\}` and the positive :math:`\\{S_p^+\\}` scores for one probe item :math:`p`, or ``None`` in case of open set recognition. If ``threshold`` is set to ``None``, the rank 1 recognition rate is defined as the number of test items, for which the highest positive :math:`\\max\\{S_p^+\\}` score is greater than or equal to all negative scores, divided by the number of all probe items :math:`P`: .. math:: \\mathrm{RR} = \\frac{1}{P} \\sum_{p=1}^{P} \\begin{cases} 1 & \\mathrm{if } \\max\\{S_p^+\\} >= \\max\\{S_p^-\\}\\\\ 0 & \\mathrm{otherwise} \\end{cases} For a given rank :math:`r>1`, up to :math:`r` negative scores that are higher than the highest positive score are allowed to still count as correctly classified in the top :math:`r` rank. If ``threshold`` :math:`\\theta` is given, **all** scores below threshold will be filtered out. Hence, if all positive scores are below threshold :math:`\\max\\{S_p^+\\} < \\theta`, the probe will be misclassified **at any rank**. For open set recognition, i.e., when there exist a tuple including negative scores without corresponding positive scores (``None``), and **all** negative scores are below ``threshold`` :math:`\\max\\{S_p^+\\} < \\theta`, the probe item is correctly rejected, **and it does not count into the denominator** :math:`P`. When no ``threshold`` is provided, the open set probes will **always** count as misclassified, regardless of the ``rank``. .. warn: For open set tests, this rate does not correspond to a standard rate. Please use :py:func:`detection_identification_rate` and :py:func:`false_alarm_rate` instead. Parameters: cmc_scores (:py:class:`list`): A list in the format ``[(negatives, positives), ...]`` containing the CMC scores (i.e. :py:class:`list`: A list of tuples, where each tuple contains the ``negative`` and ``positive`` scores for one probe of the database). Each pair contains the ``negative`` and the ``positive`` scores for **one probe item**. Each pair can contain up to one empty array (or ``None``), i.e., in case of open set recognition. threshold (:obj:`float`, optional): Decision threshold. If not ``None``, **all** scores will be filtered by the threshold. In an open set recognition problem, all open set scores (negatives with no corresponding positive) for which all scores are below threshold, will be counted as correctly rejected and **removed** from the probe list (i.e., the denominator). rank (:obj:`int`, optional): The rank for which the recognition rate should be computed, 1 by default. Returns: float: The (open set) recognition rate for the given rank, a value between 0 and 1. """ # If no scores are given, the recognition rate is exactly 0. if not cmc_scores: return 0. correct = 0 counter = 0 for neg, pos in cmc_scores: # set all values that are empty before to None if pos is not None and not numpy.array(pos).size: pos = None if neg is not None and not numpy.array(neg).size: neg = None if pos is None and neg is None: raise ValueError("One pair of the CMC scores has neither positive nor negative values") # filter out any negative or positive scores below threshold; scores with exactly the threshold are also filtered out # now, None and an empty array have different meanings. if threshold is not None: if neg is not None: neg = numpy.array(neg)[neg > threshold] if pos is not None: pos = numpy.array(pos)[pos > threshold] if pos is None: # no positives, so we definitely do not have a match; # check if we have negatives above threshold if not neg.size: # we have no negative scores over the threshold, so we have correctly rejected the probe # don't increase any of the two counters... continue # we have negatives over threshold, so we have incorrect classifications; independent on the actual rank counter += 1 else: # we have a positive, so we need to count the probe counter += 1 if not numpy.array(pos).size: # all positive scores have been filtered out by the threshold, we definitely have a mis-match continue # get the maximum positive score for the current probe item # (usually, there is only one positive score, but just in case...) max_pos = numpy.max(pos) if neg is None or not numpy.array(neg).size: # if we had no negatives, or all negatives were below threshold, we have a match at rank 1 correct += 1 else: # count the number of negative scores that are higher than the best positive score index = numpy.sum(neg >= max_pos) if index < rank: correct += 1 return float(correct) / float(counter)
[docs]def cmc(cmc_scores): """Calculates the cumulative match characteristic (CMC) from the given input. The input has a specific format, which is a list of two-element tuples. Each of the tuples contains the negative and the positive scores for one probe item. For each probe item the probability that the rank :math:`r` of the positive score is calculated. The rank is computed as the number of negative scores that are higher than the positive score. If several positive scores for one test item exist, the **highest** positive score is taken. The CMC finally computes how many test items have rank r or higher, divided by the total number of test values. .. note:: The CMC is not available for open set classification. Please use the :py:func:`detection_identification_rate` and :py:func:`false_alarm_rate` instead. Parameters ---------- cmc_scores : :py:class:`list` A list in the format ``[(negatives, positives), ...]`` containing the CMC scores. Each pair contains the ``negative`` and the ``positive`` scores for **one probe item**. Each pair can contain up to one empty array (or ``None``), i.e., in case of open set recognition. Returns ------- 1D :py:class:`numpy.ndarray` of `float` A 1D float array representing the CMC curve. The rank 1 recognition rate can be found in ``array[0]``, rank 2 rate in ``array[1]``, and so on. The number of ranks (``array.shape[0]``) is the number of gallery items. Values are in range ``[0,1]``. """ # If no scores are given, we cannot plot anything probe_count = float(len(cmc_scores)) if not probe_count: raise ValueError("The given set of scores is empty") # compute MC match_characteristic = numpy.zeros((max([len(neg) for neg, _ in cmc_scores if neg is not None])+1,), numpy.int) for neg, pos in cmc_scores: if pos is None or not numpy.array(pos).size: raise ValueError("For the CMC computation at least one positive score per pair is necessary.") if neg is None: neg = [] # get the maximum positive score for the current probe item # (usually, there is only one positive score, but just in case...) max_pos = numpy.max(pos) # count the number of negative scores that are higher than the best positive score index = numpy.sum(neg >= max_pos) match_characteristic[index] += 1 # cumulate cumulative_match_characteristic = numpy.cumsum(match_characteristic, dtype=numpy.float64) return cumulative_match_characteristic / probe_count
[docs]def detection_identification_rate(cmc_scores, threshold, rank = 1): """Computes the `detection and identification rate` for the given threshold. This value is designed to be used in an open set identification protocol, and defined in Chapter 14.1 of [LiJain2005]_. Although the detection and identification rate is designed to be computed on an open set protocol, it uses only the probe elements, for which a corresponding gallery element exists. For closed set identification protocols, this function is identical to :py:func:`recognition_rate`. The only difference is that for this function, a ``threshold`` for the scores need to be defined, while for :py:func:`recognition_rate` it is optional. Parameters: cmc_scores (:py:class:`list`): A list in the format ``[(negatives, positives), ...]`` containing the CMC. Each pair contains the ``negative`` and the ``positive`` scores for **one probe item**. Each pair can contain up to one empty array (or ``None``), i.e., in case of open set recognition. threshold (float): The decision threshold :math:`\\tau``. rank (:obj:`int`, optional): The rank for which the curve should be plotted Returns: float: The detection and identification rate for the given threshold. """ # count the correctly classifier probes correct = 0 counter = 0 for neg, pos in cmc_scores: if pos is None or not numpy.array(pos).size: # we only consider probes with corresponding gallery items continue # we have an in-gallery probe counter += 1 # check, if it is correctly classified if neg is None: neg = [] # get the maximum positive score for the current probe item # (usually, there is only one positive score, but just in case...) max_pos = numpy.max(pos) index = numpy.sum(neg >= max_pos) # compute the rank (in fact, rank - 1) if max_pos >= threshold and index < rank: correct += 1 if not counter: logger.warn("No in-gallery probe was found") return 0. return float(correct) / float(counter)
[docs]def false_alarm_rate(cmc_scores, threshold): """Computes the `false alarm rate` for the given threshold,. This value is designed to be used in an open set identification protocol, and defined in Chapter 14.1 of [LiJain2005]_. The false alarm rate is designed to be computed on an open set protocol, it uses only the probe elements, for which **no** corresponding gallery element exists. Parameters: cmc_scores (:py:class:`list`): A list in the format ``[(negatives, positives), ...]`` containing the CMC scores (i.e. :py:class:`list`: A list of tuples, where each tuple contains the ``negative`` and ``positive`` scores for one probe of the database). Each pair contains the ``negative`` and the ``positive`` scores for **one probe item**. Each pair can contain up to one empty array (or ``None``), i.e., in case of open set recognition. threshold (float): The decision threshold :math:`\\tau``. Returns: float: The false alarm rate. """ incorrect = 0 counter = 0 for neg, pos in cmc_scores: # we only consider the out-of-gallery probes, i.e., with no positive scores if pos is None or not numpy.array(pos).size: counter += 1 # check if the probe is above threshold if neg is None or not numpy.array(neg).size: raise ValueError("One pair of the CMC scores has neither positive nor negative values") if numpy.max(neg) >= threshold: incorrect += 1 if not counter: logger.warn("No out-of-gallery probe was found") return 0. return float(incorrect) / float(counter)
[docs]def eer(negatives, positives, is_sorted=False, also_farfrr=False): """Calculates the Equal Error Rate (EER). Please note that it is possible that eer != fpr != fnr. This function returns (fpr + fnr) / 2 as eer. If you also need the fpr and fnr values, set ``also_farfrr`` to ``True``. Parameters ---------- negatives : ``array_like (1D, float)`` The scores for comparisons of objects of different classes. positives : ``array_like (1D, float)`` The scores for comparisons of objects of the same class. is_sorted : bool Are both sets of scores already in ascendantly sorted order? also_farfrr : bool If True, it will also return far and frr. Returns ------- eer : float The Equal Error Rate (EER). fpr : float The False Positive Rate (FPR). Returned only when ``also_farfrr`` is ``True``. fnr : float The False Negative Rate (FNR). Returned only when ``also_farfrr`` is ``True``. """ threshold = eer_threshold(negatives, positives, is_sorted) far, frr = farfrr(negatives, positives, threshold) if also_farfrr: return (far + frr) / 2.0, far, frr return (far + frr) / 2.0
[docs]def roc_auc_score(negatives, positives, npoints=2000, min_far=-8, log_scale=False): """Area Under the ROC Curve. Computes the area under the ROC curve. This is useful when you want to report one number that represents an ROC curve. This implementation uses the trapezoidal rule for the integration of the ROC curve. For more information, see: https://en.wikipedia.org/wiki/Receiver_operating_characteristic#Area_under_the_curve Parameters ---------- negatives : array_like The negative scores. positives : array_like The positive scores. npoints : int, optional Number of points in the ROC curve. Higher numbers leads to more accurate ROC. min_far : float, optional Min FAR and FRR values to consider when calculating ROC. log_scale : bool, optional If True, converts the x axis (FPR) to log10 scale before calculating AUC. This is useful in cases where len(negatives) >> len(positives) Returns ------- float The ROC AUC. If ``log_scale`` is False, the value should be between 0 and 1. """ fpr, fnr = roc(negatives, positives, npoints, min_far=min_far) tpr = 1 - fnr if log_scale: fpr_pos = fpr > 0 fpr, tpr = fpr[fpr_pos], tpr[fpr_pos] fpr = numpy.log10(fpr) area = -1 * numpy.trapz(tpr, fpr) return area
[docs]def get_config(): """Returns a string containing the configuration information. """ import bob.extension return bob.extension.get_config(__name__, version.externals)
# gets sphinx autodoc done right - don't remove it __all__ = [_ for _ in dir() if not _.startswith('_')]