% ROCLING 2018 conference paper, pp. 46--60 of the proceedings.
% All names use the "Last, First" form. The publisher copyright line is kept
% in the separate "copyright" field (unknown to the standard styles, which
% skip unknown fields) so that it is not printed as part of "note".
@inproceedings{dba0207065a04c898fce95585015a619,
  author    = {Chen, Ying Wen and Lo, Tien Hong and Chang, Hsiu Jui and Chao, Wei Cheng and Chen, Berlin},
  title     = {On the use of speaker-aware language model adaptation techniques for meeting speech recognition},
  booktitle = {Proceedings of the 30th Conference on Computational Linguistics and Speech Processing, {ROCLING} 2018},
  editor    = {Lee, Chi-Chun and Yang, Cheng-Zen and Chien, Jen-Tzung and Chiang, Chen-Yu and Day, Min-Yuh and Tsai, Richard T.-H. and Lee, Hung-Yi and Lu, Wen-Hsiang and Wu, Shih-Hung},
  publisher = {The Association for Computational Linguistics and Chinese Language Processing (ACLCLP)},
  pages     = {46--60},
  year      = 2018,
  month     = oct,
  day       = {1},
  language  = {English},
  note      = {Conference date: 4--5 October 2018},
  copyright = {{\textcopyright} 2018 The Association for Computational Linguistics and Chinese Language Processing},
  keywords  = {Language modeling, Recurrent neural networks, Speaker adaptation, Speech recognition},
  abstract  = {This paper embarks on alleviating the problems caused by a multiple-speaker situation occurring frequently in a meeting for improved automatic speech recognition (ASR). There are a wide variety of ways for speakers to utter in the multiple-speaker situation. That is to say, people do not strictly follow the grammar when speaking and usually have a tendency to stutter while speaking, or often use personal idioms and some unique ways of speaking. Nevertheless, the existing language models employed in automatic transcription of meeting recordings rarely account for these facts but instead assume that all speakers participating in a meeting share the same speaking style or word-usage behavior. In turn, a single language model is built with all the manual transcripts of utterances compiled from multiple speakers that were taken holistically as the training set. To relax such an assumption, we endeavor to augment additional information cues into the training phase and the prediction phase of language modeling to accommodate the variety of speaker-related characteristics, through the process of speaker adaptation for language modeling. To this end, two disparate scenarios, i.e., ``known speakers'' and ``unknown speakers,'' for the prediction phase are taken into consideration for developing methods to extract speaker-related information cues to aid in the training of language models. Extensive experiments respectively carried out on automatic transcription of Mandarin and English meeting recordings show that the proposed language models along with different mechanisms for speaker adaption achieve good performance gains in relation to the baseline neural network based language model compared in this study.},
}