#!/usr/bin/env python
# vim: set fileencoding=utf-8 :
# Pavel Korshunov <pavel.korshunov@idiap.ch>
# Tue 17 May 15:43:22 CEST 2016
"""
ASVspoof database implementation of bob.bio.base.BioDatabase interface.
It is an extension of an SQL-based database interface, which directly talks to ASVspoof database, for
verification experiments (good to use in bob.bio.base framework).
"""
from bob.bio.base.database import BioDatabase
from bob.bio.spear.database import AudioBioFile
class ASVspoofBioFile(AudioBioFile):
def __init__(self, f):
"""
Initializes this File object with an File equivalent from the underlying SQl-based interface for
ASVspoof database.
"""
super(ASVspoofBioFile, self).__init__(client_id=f.client_id, path=f.path, file_id=f.id)
self.__f = f
class ASVspoofBioDatabase(BioDatabase):
"""
Implements verification API for querying ASVspoof database.
"""
def __init__(self, **kwargs):
# call base class constructors to open a session to the database
super(ASVspoofBioDatabase, self).__init__(name='asvspoof', **kwargs)
from bob.db.asvspoof.query import Database as LowLevelDatabase
self._db = LowLevelDatabase()
self.low_level_group_names = ('train', 'dev', 'eval')
self.high_level_group_names = ('world', 'dev', 'eval')
[docs] def model_ids_with_protocol(self, groups=None, protocol=None, gender=None):
groups = self.convert_names_to_lowlevel(groups, self.low_level_group_names, self.high_level_group_names)
return [client.id for client in self._db.clients(groups=groups, gender=gender)]
[docs] def objects(self, protocol=None, purposes=None, model_ids=None, groups=None, **kwargs):
# convert group names from the conventional in verification experiments to the internal database names
if groups is None: # all groups are assumed
groups = self.high_level_group_names
matched_groups = self.convert_names_to_lowlevel(groups, self.low_level_group_names, self.high_level_group_names)
# this conversion of the protocol with appended '-licit' or '-spoof' is a hack for verification experiments.
# To adapt spoofing databases to the verification experiments, we need to be able to split a given protocol
# into two parts: when data for licit (only real/genuine data is used) and data for spoof (attacks are used instead
# of real data) is used in the experiment. Hence, we use this trick with appending '-licit' or '-spoof' to the
# protocol name, so we can distinguish these two scenarios.
# By default, if nothing is appended, we assume licit protocol.
# The distinction between licit and spoof is expressed via purposes parameters
# this is the difference in terminology.
# lets check if we have an appendix to the protocol name
appendix = None
if protocol:
appendix = protocol.split('-')[-1]
# if protocol was empty or there was no correct appendix, we just assume the 'licit' option
if not (appendix == 'licit' or appendix == 'spoof'):
appendix = 'licit'
else:
# put back everything except the appendix into the protocol
protocol = '-'.join(protocol.split('-')[:-1])
# if protocol was empty, we set it to the ASV-female, which is the female data for verification experiments
if not protocol:
protocol = 'ASV-female'
correct_purposes = purposes
# licit protocol is for real access data only
if appendix == 'licit':
# by default we assume all real data
if purposes is None:
correct_purposes = ('real', 'impostor')
# otherwise replace 'probe' with 'impostor'
elif isinstance(purposes, (tuple, list)):
correct_purposes = []
for purpose in purposes:
if purpose == 'probe':
correct_purposes += ['impostor']
else:
correct_purposes += [purpose]
elif purposes == 'probe':
correct_purposes = ('impostor',)
# for any other protocol use real data and spoofed data (probe)
# so, probe set is the same as attack set
else:
# by default we return attacks only for 'world' group
# and (real:realdata + probe:attackdata) for dev and eval
if purposes is None:
correct_purposes = ('attack',) if 'train' in matched_groups else ('real', 'attack')
# otherwise replace 'probe' with 'attack'
elif isinstance(purposes, (tuple, list)):
correct_purposes = []
for purpose in purposes:
if purpose == 'probe':
correct_purposes += ['attack']
else:
correct_purposes += [purpose]
elif purposes == 'probe':
correct_purposes = ('attack',)
# now, query the actual ASVspoof database
objects = self._db.objects(protocol=protocol, groups=matched_groups, purposes=correct_purposes,
clients=model_ids, **kwargs)
# make sure to return AudioBioFile representation of a file, not the database one
return [ASVspoofBioFile(f) for f in objects]
[docs] def annotations(self, file):
return None