Source code for bob.pad.voice.algorithm.gmm_algorithm

#!/usr/bin/env python
# vim: set fileencoding=utf-8 :
# @author: Pavel Korshunov <pavel.korshunov@idiap.ch>
# @date: Wed 19 Oct 23:43:22 2016

import bob.io.base

import numpy

import bob.learn.linear
import bob.learn.em

from bob.pad.base.algorithm import Algorithm

import logging

logger = logging.getLogger("bob.pad.voice")


class GmmAlgorithm(Algorithm):
    """Trains Logistical Regression classifier and projects testing dat on it."""

    def __init__(self,
                 normalize_features=False,
                 # parameters for the GMM
                 number_of_gaussians=512,
                 # parameters of UBM training
                 kmeans_training_iterations=25,  # Maximum number of iterations for K-Means
                 gmm_training_iterations=10,  # Maximum number of iterations for ML GMM Training
                 training_threshold=5e-4,  # Threshold to end the ML training
                 variance_threshold=5e-4,  # Minimum value that a variance can reach
                 update_weights=True,
                 update_means=True,
                 update_variances=True,
                 responsibility_threshold=0,
                 # If set, the weight of a particular Gaussian will at least be greater than this threshold. In the case the real weight is lower, the prior mean value will be used to estimate the current mean and variance.
                 INIT_SEED=2015,
                 requires_projector_training=False,
                 **kwargs):

        # call base class constructor registering that this tool performs everything.
        Algorithm.__init__(
            self,
            number_of_gaussians=number_of_gaussians,
            kmeans_training_iterations=kmeans_training_iterations,
            gmm_training_iterations=gmm_training_iterations,
            training_threshold=training_threshold,
            variance_threshold=variance_threshold,
            update_weights=update_weights,
            update_means=update_means,
            update_variances=update_variances,
            responsibility_threshold=responsibility_threshold,
            INIT_SEED=INIT_SEED,
            # parameters of detection pipeline
            performs_projection=True,
            requires_projector_training=requires_projector_training,
            use_projected_features_for_enrollment=False,
            multiple_model_scoring=None,
        )
        # copy parameters
        self.gaussians = number_of_gaussians
        self.kmeans_training_iterations = kmeans_training_iterations
        self.gmm_training_iterations = gmm_training_iterations
        self.training_threshold = training_threshold
        self.variance_threshold = variance_threshold
        self.update_weights = update_weights
        self.update_means = update_means
        self.update_variances = update_variances
        self.responsibility_threshold = responsibility_threshold
        self.init_seed = INIT_SEED
        self.rng = bob.core.random.mt19937(self.init_seed)

        self.gmm_machine_real = None
        self.gmm_machine_attack = None
        self.normalize_features = normalize_features
        self.kmeans_trainer = bob.learn.em.KMeansTrainer()
        self.gmm_trainer = bob.learn.em.ML_GMMTrainer(self.update_means, self.update_variances, self.update_weights,
                                                      self.responsibility_threshold)

    def _check_feature(self, feature, machine=None, projected=False):
        """Checks that the features are appropriate."""
        if not isinstance(feature, numpy.ndarray) or feature.ndim != 2 or feature.dtype != numpy.float64:
            raise ValueError("The given feature is not appropriate", feature)
        if self.gmm_machine_real is not None and feature.shape[1] != self.gmm_machine_real.shape[1]:
            raise ValueError("The given feature is expected to have %d elements, but it has %d" % (
            self.gmm_machine_real.shape[1], feature.shape[1]))
        if self.gmm_machine_attack is not None and feature.shape[1] != self.gmm_machine_attack.shape[1]:
            raise ValueError("The given feature is expected to have %d elements, but it has %d" % (
            self.gmm_machine_attack.shape[1], feature.shape[1]))
        return True

    #######################################################
    ################ GMM training #########################

[docs]    def train_gmm(self, array):

        logger.debug(" .... Training with %d feature vectors", array.shape[0])

        # Computes input size
        input_size = array.shape[1]

        # Creates the machines (KMeans and GMM)
        logger.debug(" .... Creating machines")
        kmeans_machine = bob.learn.em.KMeansMachine(self.gaussians, input_size)
        gmm_machine = bob.learn.em.GMMMachine(self.gaussians, input_size)

        # initialize the random generator with out one single cool seed that allows us to reproduce experiments
        logger.info("  -> Init random generator with seed %d", self.init_seed)
        self.rng = bob.core.random.mt19937(self.init_seed)

        # Trains using the KMeansTrainer
        logger.info("  -> Training K-Means")
        bob.learn.em.train(self.kmeans_trainer, kmeans_machine, array, self.kmeans_training_iterations,
                           self.training_threshold, self.rng)

        variances, weights = kmeans_machine.get_variances_and_weights_for_each_cluster(array)
        means = kmeans_machine.means

        # Initializes the GMM
        gmm_machine.means = means
        gmm_machine.variances = variances
        gmm_machine.weights = weights
        gmm_machine.set_variance_thresholds(self.variance_threshold)

        # Trains the GMM
        logger.info("  -> Training GMM")
        bob.learn.em.train(self.gmm_trainer, gmm_machine, array, self.gmm_training_iterations,
                           self.training_threshold, self.rng)
        return gmm_machine

[docs]    def save_gmms(self, projector_file):
        """Save projector to file"""
        # Saves the trained GMMs to file
        logger.debug(" .... Saving GMM models to file '%s'", projector_file)
        hdf5 = projector_file if isinstance(projector_file, bob.io.base.HDF5File) else bob.io.base.HDF5File(
            projector_file, 'w')
        hdf5.create_group('GMMReal')
        hdf5.cd('GMMReal')
        self.gmm_machine_real.save(hdf5)
        hdf5.cd('/')
        hdf5.create_group('GMMAttack')
        hdf5.cd('GMMAttack')
        self.gmm_machine_attack.save(hdf5)

[docs]    def train_projector(self, training_features, projector_file):
        if len(training_features) < 2:
            raise ValueError("Training projector: features should contain two lists: real and attack!")

        logger.info(" - Training: number of real features %d", len(training_features[0]))
        logger.info(" - Training: number of attack features %d", len(training_features[1]))

        [self._check_feature(feature) for feature in training_features[0]]
        [self._check_feature(feature) for feature in training_features[1]]

        # Loads the data into an arrays
        real_features = numpy.vstack(training_features[0])
        attack_features = numpy.vstack(training_features[1])

        print ("GmmAlgorithm:train_projector(), real_features shape:", real_features.shape)
        print ("GmmAlgorithm:train_projector(), attack_features shape:", attack_features.shape)
        print ("Min real ", numpy.min(real_features))
        print ("Max real ", numpy.max(real_features))
        print ("Min attack ", numpy.min(attack_features))
        print ("Max attack ", numpy.max(attack_features))

        logger.info("  -> Training GMM model with %s real training features", str(real_features.shape))
        self.gmm_machine_real = self.train_gmm(real_features)

        logger.info("  -> Training GMM model with %s attack training features", str(attack_features.shape))
        self.gmm_machine_attack = self.train_gmm(attack_features)

        self.save_gmms(projector_file)

[docs]    def load_projector(self, projector_file):

        # this is a hack to load pre-trained GMMs for licit and spoof protocols
        if '_spoof' in projector_file:
            hdf5file_spoof = bob.io.base.HDF5File(projector_file)
            projector_file_licit = projector_file.replace('_spoof', '_licit')
            hdf5file_licit = bob.io.base.HDF5File(projector_file_licit)
            self.gmm_machine_real = bob.learn.em.GMMMachine(hdf5file_licit)
            self.gmm_machine_attack = bob.learn.em.GMMMachine(hdf5file_spoof)
        else:  # this is a 'normal' case
            hdf5file = bob.io.base.HDF5File(projector_file)
            # read GMM for real data
            hdf5file.cd('/GMMReal')
            self.gmm_machine_real = bob.learn.em.GMMMachine(hdf5file)
            # read GMM for attack data
            hdf5file.cd('/GMMAttack')
            self.gmm_machine_attack = bob.learn.em.GMMMachine(hdf5file)

        self.gmm_machine_real.set_variance_thresholds(self.variance_threshold)
        self.gmm_machine_attack.set_variance_thresholds(self.variance_threshold)

[docs]    def project_feature(self, feature):

        feature = numpy.asarray(feature, dtype=numpy.float64)

        logger.debug(" .... Projecting %d features vector" % feature.shape[0])

        # return the resulting statistics
        return numpy.asarray([self.gmm_machine_real(feature), self.gmm_machine_attack(feature)], dtype=numpy.float64)

[docs]    def project(self, feature):
        """project(feature) -> projected

        Projects the given feature into GMM space.

        **Parameters:**

        feature : 1D :py:class:`numpy.ndarray`
          The 1D feature to be projected.

        **Returns:**

        projected : 1D :py:class:`numpy.ndarray`
          The ``feature`` projected into GMM space.
        """

        if len(feature) > 0:
            self._check_feature(feature)
            return self.project_feature(feature)
        else:
            return numpy.zeros(1, dtype=numpy.float64)

[docs]    def read_gmm_stats(self, gmm_stats_file):
        """Reads GMM stats from file."""
        hdf5file = bob.io.base.HDF5File(gmm_stats_file)
        # read GMM for real data
        hdf5file.cd('/GMMReal')
        gmm_stats_real = bob.learn.em.GMMStats(hdf5file)
        # read GMM for attack data
        hdf5file.cd('/GMMAttack')
        gmm_stats_attack = bob.learn.em.GMMStats(hdf5file)

        return [gmm_stats_real, gmm_stats_attack]

[docs]    def score(self, toscore):
        """Returns the difference between log likelihoods of being real or attack"""
        return [toscore[0] - toscore[1]]

[docs]    def score_for_multiple_projections(self, toscore):
        """Returns the difference between log likelihoods of being real or attack"""
        self.score(toscore)


algorithm = GmmAlgorithm()