@inproceedings{a69a7cfaab3843c698b6823c9072686b,
title = "Simultaneous Flexible Keyword Detection and Text-dependent Speaker Recognition for Low-resource Devices",
abstract = "This paper proposes a new method for simultaneous flexible keyword detection and text-dependent speaker identification using a recognized keyword. The purpose is to identify a speaker from among a set of preregistered speakers on the basis of a short-command utterance in an office or home on low-resource chip devices. The first contribution is to construct the process that includes a neural network (NN) and a customized Viterbi-based algorithm for flexible keyword detection, and Gaussian mixture models (GMMs) for speaker identification. Outputs of a middle layer in the NN and alignment information for keyword detection are also used for creating feature vectors for speaker GMMs. The second contribution is to apply DropConnect in speaker-modeling uncertainties of the Bayesian NN that is used for speaker reacognition. It results in robust speaker models when enrollment utterances are few. Evaluation was conducted using 39 Japanese keywords by 100 speakers. Recognition performance was measured on the basis of false acceptances and false rejects using keyword utterances. Speaker identification for 100 pre-registered speakers for recognized keywords was simultaneously evaluated. The identification rate when using a conventional i-vector method was 71.22\%. By contrast, the identification rate of the proposed method was 89.29\% while using low-cost resources.",
keywords = "Bayesian, Detection, Low Resource Device, Speaker Identification",
author = "Hiroshi Fujimura and Ning Ding and Daichi Hayakawa and Takehiko Kagoshima",
note = "Publisher Copyright: {\textcopyright} 2022 by SCITEPRESS Science and Technology Publications, Lda. All rights reserved.; 9th International Conference on Pattern Recognition Applications and Methods , ICPRAM 2020 ; Conference date: 22-02-2020 Through 24-02-2020",
year = "2020",
doi = "10.5220/0008903202970307",
language = "英语",
isbn = "9789897583971",
series = "International Conference on Pattern Recognition Applications and Methods",
publisher = "Science and Technology Publications, Lda",
pages = "297--307",
editor = "\{De Marsico\}, Maria and \{Sanniti di Baja\}, Gabriella and Fred, \{Ana L.N.\}",
booktitle = "ICPRAM 2020 - Proceedings of the 9th International Conference on Pattern Recognition Applications and Methods, Volume 1",
}