% Conference paper (inproceedings) from the ICTIR 2023 proceedings.
% booktitle carries the full proceedings title; series is only the short
% proceedings label, so styles do not print the long title twice.
% address is the publisher's city; conference and funding details are in note.
% day and language are not standard BibTeX fields and are ignored by
% the standard styles.
@inproceedings{f2d45ae2c0b34f4897743236a3c4ff85,
  author    = {Ros, Kevin and Jin, Matthew and Levine, Jacob and Zhai, {Cheng Xiang}},
  title     = {Retrieving Webpages Using Online Discussions},
  booktitle = {{ICTIR} 2023 - Proceedings of the 2023 {ACM} {SIGIR} International Conference on the Theory of Information Retrieval},
  series    = {{ICTIR} '23},
  pages     = {159--168},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2023},
  month     = aug,
  day       = {9},
  doi       = {10.1145/3578337.3605139},
  language  = {English (US)},
  keywords  = {discussion forums, hyperlink prediction, information retrieval},
  abstract  = {Online discussions are a ubiquitous aspect of everyday life. An Internet user who interacts with an online discussion may benefit from seeing hyperlinks to webpages relevant to the discussion because the relevant webpages can provide added context, act as citations for background sources, or condense information so that conversations can proceed seamlessly at a high level. In this paper, we propose and study a new task of retrieving relevant webpages given an online discussion. We frame the task as a novel retrieval problem where we treat a sequence of comments in an online discussion as a query and use such a query to retrieve relevant webpages. We construct a new data set using Reddit, an online discussion forum, to study this new problem. We explore and evaluate multiple representative retrieval methods to examine their effectiveness for solving this new problem. We also propose to leverage the comments that contain hyperlinks as training data to enable supervised learning and further improve retrieval performance. We find that results using modern retrieval methods are promising and that leveraging comments with hyperlinks as training data can further improve performance. We release our data set and code to enable additional research in this direction.},
  note      = {This work is supported in part by the IBM-Illinois Discovery Accelerator Institute and by the National Science Foundation under Grant No. 1801652.; 9th ACM SIGIR International Conference on the Theory of Information Retrieval, ICTIR 2023 ; Conference date: 23-07-2023},
}