Publications – Laboratory for Machine Intelligence

Beveridge, Ross; Zhang, Hao; Draper, Bruce A; Flynn, Patrick J; Feng, Zhenhua; Huber, Patrik; Kittler, Josef; Huang, Zhiwu; Li, Shaoxin; Li, Yan; Štruc, Vitomir; Križaj, Janez; et al.

Report on the FG 2015 video person recognition evaluation Proceedings Article

In: 11th IEEE International Conference and Workshops on Automatic Face and Gesture Recognition (IEEE FG), pp. 1–8, IEEE 2015.

Abstract | Links | BibTeX | Tags: biometrics, competition, face verification, FG, group evaluation, PaSC, performance evaluation

Justin, Tadej; Štruc, Vitomir; Dobrišek, Simon; Vesnicer, Boštjan; Ipšić, Ivo; Mihelič, France

Speaker de-identification using diphone recognition and speech synthesis Proceedings Article

In: 11th IEEE International Conference and Workshops on Automatic Face and Gesture Recognition (IEEE FG): DeID 2015, pp. 1–7, IEEE 2015.

Abstract | Links | BibTeX | Tags: DEID, FG, speech deidentification, speech recognition, speech synthesis, speech technologies

% Conference paper record. Author names use the unambiguous "Last, First"
% form; acronyms in booktitle are brace-protected so that styles which
% recase titles keep their capitalisation.
% NOTE(review): date/urldate of 2015-01-01 look like export placeholders
% rather than the real event/access dates -- confirm before relying on them.
@inproceedings{justin2015speaker,
  author       = {Justin, Tadej and Štruc, Vitomir and Dobrišek, Simon and Vesnicer, Boštjan and Ipšić, Ivo and Mihelič, France},
  title        = {Speaker de-identification using diphone recognition and speech synthesis},
  booktitle    = {11th {IEEE} International Conference and Workshops on Automatic Face and Gesture Recognition ({IEEE} {FG}): {DeID} 2015},
  volume       = {4},
  pages        = {1--7},
  organization = {IEEE},
  year         = {2015},
  date         = {2015-01-01},
  url          = {https://lmi.fe.uni-lj.si/en/speakerde-identificationusingdiphonerecognitionandspeechsynthesis/},
  urldate      = {2015-01-01},
  abstract     = {The paper addresses the problem of speaker (or voice) de-identification by presenting a novel approach for concealing the identity of speakers in their speech. The proposed technique first recognizes the input speech with a diphone recognition system and then transforms the obtained phonetic transcription into the speech of another speaker with a speech synthesis system. Due to the fact that a Diphone RecOgnition step and a sPeech SYnthesis step are used during the deidentification, we refer to the developed technique as DROPSY. With this approach the acoustical models of the recognition and synthesis modules are completely independent from each other, which ensures the highest level of input speaker deidentification. The proposed DROPSY-based de-identification approach is language dependent, text independent and capable of running in real-time due to the relatively simple computing methods used. When designing speaker de-identification technology two requirements are typically imposed on the deidentification techniques: i) it should not be possible to establish the identity of the speakers based on the de-identified speech, and ii) the processed speech should still sound natural and be intelligible. This paper, therefore, implements the proposed DROPSY-based approach with two different speech synthesis techniques (i.e., with the HMM-based and the diphone TDPSOLA-based technique). The obtained de-identified speech is evaluated for intelligibility and evaluated in speaker verification experiments with a state-of-the-art (i-vector/PLDA) speaker recognition system. The comparison of both speech synthesis modules integrated in the proposed method reveals that both can efficiently de-identify the input speakers while still producing intelligible speech.},
  keywords     = {DEID, FG, speech deidentification, speech recognition, speech synthesis, speech technologies},
  pubstate     = {published},
  tppubtype    = {inproceedings}
}

Close

Dobrišek, Simon; Štruc, Vitomir; Križaj, Janez; Mihelič, France

Face recognition in the wild with the Probabilistic Gabor-Fisher Classifier Proceedings Article

In: 11th IEEE International Conference and Workshops on Automatic Face and Gesture Recognition (IEEE FG): BWild 2015, pp. 1–6, IEEE 2015.

Abstract | Links | BibTeX | Tags: biometrics, BWild, FG, Gabor features, PaSC, plda, probabilistic Gabor Fisher classifier, probabilistic linear discriminant analysis

% Conference paper record. The proper nouns in the title ("Gabor-Fisher")
% and the acronyms in booktitle are brace-protected so that sentence-casing
% bibliography styles do not lowercase them. Author names use the
% unambiguous "Last, First" form.
% NOTE(review): date/urldate of 2015-01-01 look like export placeholders
% rather than the real event/access dates -- confirm before relying on them.
@inproceedings{dobrivsek2015face,
  author       = {Dobrišek, Simon and Štruc, Vitomir and Križaj, Janez and Mihelič, France},
  title        = {Face recognition in the wild with the Probabilistic {Gabor-Fisher} Classifier},
  booktitle    = {11th {IEEE} International Conference and Workshops on Automatic Face and Gesture Recognition ({IEEE} {FG}): {BWild} 2015},
  volume       = {2},
  pages        = {1--6},
  organization = {IEEE},
  year         = {2015},
  date         = {2015-01-01},
  url          = {https://lmi.fe.uni-lj.si/en/facerecognitioninthewildwiththeprobabilisticgabor-fisherclassifier/},
  urldate      = {2015-01-01},
  abstract     = {The paper addresses the problem of face recognition in the wild. It introduces a novel approach to unconstrained face recognition that exploits Gabor magnitude features and a simplified version of the probabilistic linear discriminant analysis (PLDA). The novel approach, named Probabilistic Gabor-Fisher Classifier (PGFC), first extracts a vector of Gabor magnitude features from the given input image using a battery of Gabor filters, then reduces the dimensionality of the extracted feature vector by projecting it into a low-dimensional subspace and finally produces a representation suitable for identity inference by applying PLDA to the projected feature vector. The proposed approach extends the popular Gabor-Fisher Classifier (GFC) to a probabilistic setting and thus improves on the generalization capabilities of the GFC method. The PGFC technique is assessed in face verification experiments on the Point and Shoot Face Recognition Challenge (PaSC) database, which features real-world videos of subjects performing everyday tasks. Experimental results on this challenging database show the feasibility of the proposed approach, which improves on the best results on this database reported in the literature by the time of writing.},
  keywords     = {biometrics, BWild, FG, Gabor features, PaSC, plda, probabilistic Gabor Fisher classifier, probabilistic linear discriminant analysis},
  pubstate     = {published},
  tppubtype    = {inproceedings}
}

Close

Križaj, Janez; Štruc, Vitomir; Dobrišek, Simon

Combining 3D face representations using region covariance descriptors and statistical models Proceedings Article

In: Proceedings of the IEEE International Conference on Automatic Face and Gesture Recognition and Workshops (IEEE FG), Workshop on 3D Face Biometrics, IEEE, Shanghai, China, 2013.

Abstract | Links | BibTeX | Tags: 3d face recognition, biometrics, covariance descriptors, face recognition, face verification, FG, gaussian mixture models, GMM, unscented transform

% Conference paper record. "3D" in the title and the acronyms in booktitle
% are brace-protected so that sentence-casing bibliography styles keep their
% capitalisation. Author names use the unambiguous "Last, First" form.
% NOTE(review): `address` appears to hold the conference location
% (Shanghai, China) rather than the publisher's city; it is kept so existing
% styles render the entry as before -- biblatex users may prefer `venue`.
@inproceedings{FG2013,
  author    = {Križaj, Janez and Štruc, Vitomir and Dobrišek, Simon},
  title     = {Combining {3D} face representations using region covariance descriptors and statistical models},
  booktitle = {Proceedings of the {IEEE} International Conference on Automatic Face and Gesture Recognition and Workshops ({IEEE} {FG}), Workshop on {3D} Face Biometrics},
  publisher = {IEEE},
  address   = {Shanghai, China},
  year      = {2013},
  date      = {2013-05-01},
  url       = {https://lmi.fe.uni-lj.si/en/combining3dfacerepresentationsusingregioncovariancedescriptorsandstatisticalmodels/},
  urldate   = {2013-05-01},
  abstract  = {The paper introduces a novel framework for 3D face recognition that capitalizes on region covariance descriptors and Gaussian mixture models. The framework presents an elegant and coherent way of combining multiple facial representations, while simultaneously examining all computed representations at various levels of locality. The framework first computes a number of region covariance matrices/descriptors from different sized regions of several image representations and then adopts the unscented transform to derive low-dimensional feature vectors from the computed descriptors. By doing so, it enables computations in the Euclidean space, and makes Gaussian mixture modeling feasible. In the last step a support vector machine classification scheme is used to make a decision regarding the identity of the modeled input 3D face image. The proposed framework exhibits several desirable characteristics, such as an inherent mechanism for data fusion/integration (through the region covariance matrices), the ability to examine the facial images at different levels of locality, and the ability to integrate domain-specific prior knowledge into the modeling procedure. We assess the feasibility of the proposed framework on the Face Recognition Grand Challenge version 2 (FRGCv2) database with highly encouraging results.},
  keywords  = {3d face recognition, biometrics, covariance descriptors, face recognition, face verification, FG, gaussian mixture models, GMM, unscented transform},
  pubstate  = {published},
  tppubtype = {inproceedings}
}

Close