% Conference paper (INTERSPEECH 2010) on extractive multi-document summarization with a latent variable model.
@inproceedings{dd15fa2fa865445d9ae5eeb8535ff515,
  author    = {Celikyilmaz, Asli and Hakkani-T{\"u}r, Dilek},
  title     = {Extractive summarization using a latent variable model},
  booktitle = {Proceedings of the 11th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2010},
  year      = {2010},
  pages     = {2526--2529},
  publisher = {International Speech Communication Association},
  keywords  = {Discriminative classification, Summarization, Topic modeling},
  abstract  = {Extractive multi-document summarization is the task of choosing sentences from a set of documents to compose a summary text in response to a user query. We propose a generative approach to explicitly identify summary and non-summary topic distributions in the sentences of a given set of documents (i.e., document cluster). Using these approximate summary topic probabilities as latent output variables, we build a discriminative classifier model. The sentences in new document clusters are inferred using the trained discriminative model. In our experiments we find that the proposed summarization approach is effective in comparison to the state-of-the-art methods.},
  language  = {English (US)},
}