@inbook{e8206029a24e452b8a8878ee97863fcf,
title = "Multistream Dynamic Bayesian Network for Meeting Segmentation",
abstract = "This paper investigates the automatic analysis and segmentation of meetings. A meeting is analysed in terms of individual behaviours and group interactions, in order to decompose each meeting in a sequence of relevant phases, named meeting actions. Three feature families are extracted from multimodal recordings: prosody from individual lapel microphone signals, speaker activity from microphone array data and lexical features from textual transcripts. A statistical approach is then used to relate low-level features with a set of abstract categories. In order to provide a flexible and powerful framework, we have employed a dynamic Bayesian network based model, characterized by multiple stream processing and flexible state duration modelling. Experimental results demonstrate the strength of this system, providing a meeting action error rate of 9%.",
author = "Alfred Dielmann and Steve Renals",
year = "2005",
doi = "10.1007/978-3-540-30568-2_7",
language = "English",
isbn = "978-3-540-24509-4",
series = "Lecture Notes in Computer Science",
publisher = "Springer",
pages = "76--86",
editor = "Samy Bengio and Herv{\'e} Bourlard",
booktitle = "Machine Learning for Multimodal Interaction",
address = "United Kingdom",
note = "First International Workshop MLMI 2004 ; Conference date: 21-06-2004 Through 23-06-2004",
}