% Conference paper from INTERSPEECH 2012 on detecting system-addressed
% speech in human-human-computer dialog.
% Notes on this entry:
%   - No series field: the proceedings title lives in booktitle only, so
%     styles that print series do not repeat the conference name.
%   - Percent signs in the abstract are escaped so the text stays intact
%     if a style typesets the abstract.
%   - The note field carries only the conference dates.
@inproceedings{ad3064ced27646798aa1bcd4d4e6f7af,
  author    = {Shriberg, Elizabeth and Stolcke, Andreas and Hakkani-T{\"u}r, Dilek and Heck, Larry},
  title     = {Learning when to listen: Detecting system-addressed speech in human-human-computer dialog},
  booktitle = {13th Annual Conference of the International Speech Communication Association 2012, {INTERSPEECH} 2012},
  publisher = {International Speech Communication Association},
  year      = {2012},
  pages     = {334--337},
  doi       = {10.21437/interspeech.2012-83},
  isbn      = {9781622767595},
  language  = {English (US)},
  keywords  = {Addressee detection, Boosting, GMM, Language model, Logistic regression, Prosody, Spoken dialog system},
  abstract  = {New challenges arise for addressee detection when multiple people interact jointly with a spoken dialog system using unconstrained natural language. We study the problem of discriminating computer-directed from human-directed speech in a new corpus of human-human-computer (H-H-C) dialog, using lexical and prosodic features. The prosodic features use no word, context, or speaker information. Results with 19\% WER speech recognition show improvements from lexical features (EER=23.1\%) to prosodic features (EER=12.6\%) to a combined model (EER=11.1\%). Prosodic features also provide a 35\% error reduction over a lexical model using true words (EER from 10.2\% to 6.7\%). Modeling energy contours with GMMs provides a particularly good prosodic model. While lexical models perform well for commands, they confuse free-form system-directed speech with human-human speech. Prosodic models dramatically reduce these confusions, implying that users change speaking style as they shift addressees (computer versus human) within a session. Overall results provide strong support for combining simple acoustic-prosodic models with lexical models to detect speaking style differences for this task.},
  note      = {Conference date: 9--13 September 2012},
}