% Conference paper by Tao and Zhai in the SIGIR 2006 proceedings (ACM).
% Cleaned from an auto-export: the duplicated `series` field was dropped,
% `address` now holds the publisher location instead of a country, and the
% conference dates in `note` are written unambiguously (day-month order).
@inproceedings{8cf9a523aebe4fc093502226edf1a2b9,
  author    = {Tao, Tao and Zhai, {Cheng Xiang}},
  title     = {Regularized Estimation of Mixture Models for Robust Pseudo-Relevance Feedback},
  booktitle = {Proceedings of the Twenty-Ninth Annual International {ACM} {SIGIR} Conference on Research and Development in Information Retrieval},
  pages     = {162--169},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2006},
  month     = aug,
  doi       = {10.1145/1148170.1148201},
  isbn      = {1595933697},
  language  = {English (US)},
  keywords  = {EM, Mixture model, Pseudo feedback, Regulation},
  abstract  = {Pseudo-relevance feedback has proven to be an effective strategy for improving retrieval accuracy in all retrieval models. However the performance of existing pseudo feedback methods is often affected significantly by some parameters, such as the number of feedback documents to use and the relative weight of original query terms; these parameters generally have to be set by trial-and-error without any guidance. In this paper, we present a more robust method for pseudo feedback based on statistical language models. Our main idea is to integrate the original query with feedback documents in a single probabilistic mixture model and regularize the estimation of the language model parameters in the model so that the information in the feedback documents can be gradually added to the original query. Unlike most existing feedback methods, our new method has no parameter to tune. Experiment results on two representative data sets show that the new method is significantly more robust than a state-of-the-art baseline language modeling approach for feedback with comparable or better retrieval accuracy.},
  note      = {29th Annual International {ACM} {SIGIR} Conference on Research and Development in Information Retrieval; Conference date: 6--11 August 2006},
}