@inproceedings{0fccc510bd904f72ab4351c989b7151f,
title = "Arabic sentiment analysis: Lexicon-based and corpus-based",
abstract = "The emergence of the Web 2.0 technology generated a massive amount of raw data by enabling Internet users to post their opinions, reviews, comments on the web. Processing this raw data to extract useful information can be a very challenging task. An example of important information that can be automatically extracted from the users' posts and comments is their opinions on different issues, events, services, products, etc. This problem of Sentiment Analysis (SA) has been studied well on the English language and two main approaches have been devised: corpus-based and lexicon-based. This paper addresses both approaches to SA for the Arabic language. Since there is a limited number of publically available Arabic dataset and Arabic lexicons for SA, this paper starts by building a manually annotated dataset and then takes the reader through the detailed steps of building the lexicon. Experiments are conducted throughout the different stages of this process to observe the improvements gained on the accuracy of the system and compare them to corpus-based approach.",
keywords = "Arabic language, Corpus-based, Lexicon-based, Opinion mining, Sentiment analysis",
author = "Abdulla, \{Nawaf A.\} and Ahmed, \{Nizar A.\} and Shehab, \{Mohammed A.\} and Mahmoud Al-Ayyoub",
year = "2013",
doi = "10.1109/AEECT.2013.6716448",
language = "English",
isbn = "9781479923038",
series = "2013 IEEE Jordan Conference on Applied Electrical Engineering and Computing Technologies, AEECT 2013",
publisher = "IEEE Computer Society",
booktitle = "2013 IEEE Jordan Conference on Applied Electrical Engineering and Computing Technologies, AEECT 2013",
address = "United States",
note = "2013 2nd IEEE Jordan Conference on Applied Electrical Engineering and Computing Technologies, AEECT 2013 ; Conference date: 03-12-2013 Through 05-12-2013",
}