@inproceedings{e490a99427394c29a63e336662f0de6a,
title = "Sentiment analysis on Chinese movie review with distributed keyword vector representation",
abstract = "In the area of national language processing, performing machine learning technique on customer or movie review for sentiment analysis has been? frequently tried. While methods such as? support vector machine (SVM) were much favored in the 2000s, recently there is a steadily rising percentage of implementation with vector representation and artificial neural network. In this article we present an approach to implement word embedding method to conduct sentiment analysis on movie review from a renowned bulletin board system forum in Taiwan. After performing log-likelihood ratio (LLR) on the corpus and selecting the top 10000 most related keywords as representative vectors for different sentiments, we use these vectors as the sentiment classifier for the testing set. We achieved results that are not only comparable to traditional methods like Na{\"i}ve Bayes and SVM, but also outperform Latent Dirichlet Allocation, TF-IDF and its variant. It also tops the original LLR with a substantial margin.",
keywords = "LLR, machine learning, sentiment analysis, TF-IDF, word embedding",
author = "Chu, {Chun Han} and Wang, {Chen Ann} and Chang, {Yung Chun} and Wu, {Ying Wei} and Hsieh, {Yu Lun} and Hsu, {Wen Lian}",
note = "Publisher Copyright: {\textcopyright} 2016 IEEE.; 2016 Conference on Technologies and Applications of Artificial Intelligence, TAAI 2016 ; Conference date: 25-11-2016 Through 27-11-2016",
year = "2017",
month = mar,
day = "16",
doi = "10.1109/TAAI.2016.7880169",
language = "English",
series = "TAAI 2016 - 2016 Conference on Technologies and Applications of Artificial Intelligence, Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "84--89",
booktitle = "TAAI 2016 - 2016 Conference on Technologies and Applications of Artificial Intelligence, Proceedings",
address = "United States",
}