@inproceedings{26705d0efc0a457cb1e3fd93185b88d5,
title = "Improved Vocal Effort Transfer Vector Estimation for Vocal Effort-Robust Speaker Verification",
abstract = "Despite the maturity of modern speaker verification technology, its performance still significantly degrades when facing non-neutrally-phonated (e.g., shouted and whispered) speech. To address this issue, in this paper, we propose a new speaker embedding compensation method based on a minimum mean square error (MMSE) estimator. This method models the joint distribution of the vocal effort transfer vector and nonneutrally-phonated embedding spaces and operates in a principal component analysis domain to cope with non-neutrallyphonated speech data scarcity. Experiments are carried out using a cutting-edge speaker verification system integrating a powerful self-supervised pre-trained model for speech representation. In comparison with a state-of-the-art embedding compensation method, the proposed MMSE estimator yields superior and competitive equal error rate results when tackling shouted and whispered speech, respectively.",
keywords = "Speaker verification, embedding compensation, shouted speech, vocal effort, whispered speech",
author = "Espejo, {Ivan Lopez} and Santiago Prieto-Calero and Alfonso Ortega and Eduardo Lleida",
year = "2023",
month = oct,
day = "23",
doi = "10.1109/MLSP55844.2023.10285923",
language = "English",
isbn = "979-8-3503-2412-9",
series = "IEEE Workshop on Machine Learning for Signal Processing",
editor = "Danilo Comminiello and Michele Scarpiniti",
booktitle = "Proceedings of the 2023 IEEE 33rd International Workshop on Machine Learning for Signal Processing, MLSP 2023",
publisher = "IEEE",
address = "United States",
note = "2023 IEEE 33rd International Workshop on Machine Learning for Signal Processing (MLSP) ; Conference date: 17-09-2023 Through 20-09-2023",
}