@inproceedings{95aabd22e1d14ac0a45725f899260ebb,
title = "Probabilistic model-based sentiment analysis of twitter messages",
abstract = "We present a machine learning approach to sentiment classification on twitter messages (tweets). We classify each tweet into two categories: polar and non-polar. Tweets with positive or negative sentiment are considered polar. They are considered non-polar otherwise. Sentiment analysis of tweets can potentially benefit different parties, such as consumers and marketing researchers, for obtaining opinions on different products and services. We present methods for text normalization of the noisy tweets and their classification with respect to the polarity. We experiment with a mixture model approach for generation of sentimental words, which are later used as indicator features of the classification model. Based on a gold standard manually annotated ensemble of tweets, with the new approach, we obtain F-scores that are relatively 10% better than a classification baseline that uses raw word n-gram features.",
keywords = "Feature extraction, Micro-blogs, Probabilistic graphical models, Sentiment analysis, Twitter",
author = "Asli Celikyilmaz and Dilek Hakkani-T{\"u}r and Junlan Feng",
year = "2010",
doi = "10.1109/SLT.2010.5700826",
language = "English (US)",
isbn = "9781424479030",
series = "2010 IEEE Workshop on Spoken Language Technology, SLT 2010 - Proceedings",
pages = "79--84",
booktitle = "2010 IEEE Workshop on Spoken Language Technology, SLT 2010 - Proceedings",
note = "2010 IEEE Workshop on Spoken Language Technology, SLT 2010 ; Conference date: 12-12-2010 Through 15-12-2010",
}