@inproceedings{f81c5d17e8064dbb9ca337f4d15353bb,
title = "Towards Quantifying and Reducing Language Mismatch Effects in Cross-Lingual Speech Anti-Spoofing",
abstract = "The effects of language mismatch impact speech anti-spoofing systems, while investigations and quantification of these effects remain limited. Existing anti-spoofing datasets are mainly in English, and the high cost of acquiring multilingual datasets hinders training language-independent models. We initiate this work by evaluating top-performing speech anti-spoofing systems that are trained on English data but tested on other languages, observing notable performance declines. We propose an innovative approach - Accent-based data expansion via TTS (ACCENT), which introduces diverse linguistic knowledge to monolingual-trained models, improving their cross-lingual capabilities. We conduct experiments on a large-scale dataset consisting of over 3 million samples, including 1.8 million training samples and nearly 1.2 million testing samples across 12 languages. The language mismatch effects are preliminarily quantified and remarkably reduced over 15% by applying the proposed ACCENT. This easily implementable method shows promise for multilingual and low-resource language scenarios.",
keywords = "accent, cross-lingual, deepfake detection, multilingual, speech anti-spoofing",
author = "Tianchi Liu and Ivan Kukanov and Zihan Pan and Qiongqiong Wang and Sailor, {Hardik B.} and Lee, {Kong Aik}",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 2024 IEEE Spoken Language Technology Workshop, SLT 2024 ; Conference date: 02-12-2024 Through 05-12-2024",
year = "2024",
month = dec,
doi = "10.1109/SLT61566.2024.10832142",
language = "English",
series = "Proceedings of 2024 IEEE Spoken Language Technology Workshop, SLT 2024",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "1185--1192",
booktitle = "Proceedings of 2024 IEEE Spoken Language Technology Workshop, SLT 2024",
}