@inproceedings{6ba4044e554d45d98ff351f6a454d7b7,
title = "A mixture model for contextual text mining",
abstract = "Contextual text mining is concerned with extracting topical themes from a text collection with context information (e.g., time and location) and comparing/analyzing the variations of themes over different contexts. Since the topics covered in a document are usually related to the context of the document, analyzing topical themes within context can potentially reveal many interesting theme patterns. In this paper, we propose a new general probabilistic model for contextual text mining that can cover several existing models as special cases. Specifically, we extend the probabilistic latent semantic analysis (PLSA) model by introducing context variables to model the context of a document. The proposed mixture model, called contextual probabilistic latent semantic analysis (CPLSA) model, can be applied to many interesting mining tasks, such as temporal text mining, spatiotemporal text mining, author-topic analysis, and cross-collection comparative analysis. Empirical experiments show that the proposed mixture model can discover themes and their contextual variations effectively.",
keywords = "Clustering, Context, Contextual text mining, EM algorithm, Mixture model, Theme pattern",
author = "Qiaozhu Mei and Zhai, {Cheng Xiang}",
year = "2006",
doi = "10.1145/1150402.1150482",
language = "English (US)",
isbn = "1595933395",
series = "Proceedings of the ACM SIGKDD International Conference on Knowledge Discovery and Data Mining",
publisher = "Association for Computing Machinery",
pages = "649--655",
booktitle = "KDD 2006",
address = "United States",
note = "KDD 2006: 12th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining ; Conference date: 20-08-2006 Through 23-08-2006",
}