@inproceedings{39d1be7efa4b47aab14045bc6a661ad1,
title = "Multiple Points Input for Convolutional Neural Networks in Replay Attack Detection",
abstract = "The models based on convolutional neural network (CNN) have shown remarkable performance in spoofing detection for automatic speaker verification. In order to input data into CNN-based models in mini-batch unit, the shape of all data in each mini-batch must be equal. Therefore, the method to make all data have the same length should be preceded because speeches have variable lengths. Segmentation is one of the methods to make the lengths of all data be equal. It divides the data into multiple segments using sliding window. Then, the models take one segment as input. However, it means that the amount of information that can be considered at one time is limited. We proposed the multiple points input method to increase the amount of information that can be considered at one time. The CNNs get input from multiple points in an utterance that are separated far enough to have different characteristics. The experimental results on ASVspoof 2019 physical access scenarios showed that our proposed method reduced the relative equal error rate by about 44% compared to the baseline.",
keywords = "ASVspoof, convolutional neural network, multiple points input, replay attack detection, sliding window",
author = "Yoon, {Sung Hyun} and Yu, {Ha Jin}",
note = "Publisher Copyright: {\textcopyright} 2020 IEEE.; 2020 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2020 ; Conference date: 04-05-2020 Through 08-05-2020",
year = "2020",
month = may,
doi = "10.1109/ICASSP40776.2020.9053303",
language = "English",
series = "ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "6444--6448",
booktitle = "2020 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2020 - Proceedings",
address = "United States",
}