% JCDL 2018 conference paper. Authors are stored in "Last, First" form so the
% second author's surname parses as Downie (given names: J. Stephen).
@inproceedings{79a014461bb0423eab740d57985d8232,
title = "Exploratory Investigation of Word Embedding in Song Lyric Topic Classification: Promising Preliminary Results",
abstract = "In this work we investigate a data-driven vector representation of word embedding for the task of classifying song lyrics into their semantic topics. Previous research on topic classification of song lyrics has used traditional frequency based text representation. On the other hand, empirically driven word embedding has shown sensible performance improvement of text classification tasks, because of its ability to capture semantic relationship between words from big data. As averaging the word vectors from a short text is known to work reasonably well compared to the other comprehensive models utilizing their order, we adopt the averaged word vectors from the lyrics and user's interpretations about them, which are short in general, as the feature for this classification task. This simple approach showed promising classification accuracy of 57%. From this, we envision the potential of the data-driven approaches to creating features, such as the sequence of word vectors and doc2vec models, to improve the performance of the system.",
keywords = "classification, metadata, song lyrics, subject, topic, word embedding",
author = "Choi, Kahyun and Downie, J. Stephen",
note = "Publisher Copyright: {\textcopyright} 2018 Authors.; 18th ACM/IEEE Joint Conference on Digital Libraries, JCDL 2018 ; Conference date: 03-06-2018 Through 07-06-2018",
year = "2018",
month = may,
day = "23",
doi = "10.1145/3197026.3203883",
language = "English (US)",
series = "Proceedings of the ACM/IEEE Joint Conference on Digital Libraries",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "327--328",
booktitle = "JCDL 2018 - Proceedings of the 18th ACM/IEEE Joint Conference on Digital Libraries",
address = "United States",
}