% Conference paper in the ROCLING 2023 proceedings (title in Traditional Chinese, abstract in English).
% - All person names use the unambiguous "Last, First" form.
% - The publisher is wrapped in an extra brace pair so that the " and " inside the
%   organisation name is never read as a list separator.
% - The exporter's copyright / event-date text is kept verbatim in `annote` (not printed
%   by standard styles) instead of `note`, so it does not leak into the bibliography.
% - No `series` field: the exported value merely repeated `booktitle`.
@inproceedings{c7c8a7f3040f4ef79fd52f70a2dd3249,
  author    = {Yang, {Yi Ting} and Li, {Jiun Ting} and Chen, Berlin},
  title     = {基於多重注意力機制的輔助損失函數用於端到端語者標記},
  booktitle = {{ROCLING} 2023 - Proceedings of the 35th Conference on Computational Linguistics and Speech Processing},
  editor    = {Wu, Jheng-Long and Su, Ming-Hsiang and Huang, Hen-Hsen and Tsao, Yu and Tseng, Hou-Chiang and Chang, Chia-Hui and Lee, Lung-Hao and Liao, Yuan-Fu and Ma, Wei-Yun},
  publisher = {{The Association for Computational Linguistics and Chinese Language Processing (ACLCLP)}},
  year      = {2023},
  pages     = {38--43},
  language  = {繁體中文},
  keywords  = {auxiliary loss, end-to-end neural diarization, multi-head attention, speaker diarization},
  abstract  = {This study introduces a novel auxiliary function for use in the Self-Attention End-to-End Speaker Diarization (SA-EEND) model, aiming to achieve accurate speaker label prediction within overlapping speech regions. Previous research has lacked effective methods for leveraging speaker information within the model to enhance auxiliary model training and has not taken into account variations in the distribution of different speech activity patterns. This study proposes a novel auxiliary function to facilitate speaker label prediction within overlapping speech regions. By considering both the overall speech activity patterns and the task-specific speech activity patterns for different speakers, we adjust the weight matrices of the multi-head self-attention mechanism in the Transformer layers. We also select loss functions that can improve the learning performance for labels with fewer occurrences, resulting in better speaker discrimination. Experimental evaluations were conducted on Mini LibriSpeech. Although the results exhibited some limitations, there were still notable advancements made.},
  annote    = {Publisher Copyright: {\textcopyright} 2023 ROCLING 2023 - Proceedings of the 35th Conference on Computational Linguistics and Speech Processing. All rights reserved.; 35th Conference on Computational Linguistics and Speech Processing, ROCLING 2023 ; Conference date: 20-10-2023 Through 21-10-2023},
}