#!/usr/bin/env python
# vim: set fileencoding=utf-8 :
# Thu May 16 11:41:49 CEST 2013
"""Measures for calibration"""
import math
import numpy
[docs]def cllr(negatives, positives):
"""Cost of log likelihood ratio as defined by the Bosaris toolkit
Computes the 'cost of log likelihood ratio' (:math:`C_{llr}`) measure as
given in the Bosaris toolkit
Parameters:
negatives (array): 1D float array that contains the scores of the
"negative" (noise, non-class) samples of your classifier.
positives (array): 1D float array that contains the scores of the
"positive" (signal, class) samples of your classifier.
Returns:
float: The computed :math:`C_{llr}` value.
"""
sum_pos, sum_neg = 0.0, 0.0
for pos in positives:
sum_pos += math.log(1.0 + math.exp(-pos), 2.0)
for neg in negatives:
sum_neg += math.log(1.0 + math.exp(neg), 2.0)
return (sum_pos / len(positives) + sum_neg / len(negatives)) / 2.0
[docs]def min_cllr(negatives, positives):
"""Minimum cost of log likelihood ratio as defined by the Bosaris toolkit
Computes the 'minimum cost of log likelihood ratio' (:math:`C_{llr}^{min}`)
measure as given in the bosaris toolkit
Parameters:
negatives (array): 1D float array that contains the scores of the
"negative" (noise, non-class) samples of your classifier.
positives (array): 1D float array that contains the scores of the
"positive" (signal, class) samples of your classifier.
Returns:
float: The computed :math:`C_{llr}^{min}` value.
"""
# first, sort both scores
neg = sorted(negatives)
pos = sorted(positives)
N = len(neg)
P = len(pos)
II = N + P
# now, iterate through both score sets and add a 0 for negative and 1 for
# positive scores
n, p = 0, 0
ideal = numpy.zeros(II)
neg_indices = [0] * N
pos_indices = [0] * P
for i in range(II):
if p < P and (n == N or neg[n] > pos[p]):
pos_indices[p] = i
p += 1
ideal[i] = 1
else:
neg_indices[n] = i
n += 1
# compute the pool adjacent violaters method on the ideal LLR scores
ghat = numpy.ndarray(ideal.shape, dtype=numpy.float)
raise NotImplementedError("No pavx implementation")
pavx(ideal, ghat) # noqa: F821
# disable runtime warnings for a short time since log(0) will raise a warning
old_warn_setup = numpy.seterr(divide="ignore")
# ... compute logs
posterior_log_odds = numpy.log(ghat) - numpy.log(1.0 - ghat)
log_prior_odds = math.log(float(P) / float(N))
# ... activate old warnings
numpy.seterr(**old_warn_setup)
llrs = posterior_log_odds - log_prior_odds
# some weired addition
# for i in range(II):
# llrs[i] += float(i)*1e-6/float(II)
# unmix positive and negative scores
new_neg = numpy.zeros(N)
for n in range(N):
new_neg[n] = llrs[neg_indices[n]]
new_pos = numpy.zeros(P)
for p in range(P):
new_pos[p] = llrs[pos_indices[p]]
# compute cllr of these new 'optimal' LLR scores
return cllr(new_neg, new_pos)