% Conference paper published in the ACIT 2018 proceedings.
% The series field is intentionally omitted: its value would only repeat
% booktitle, and standard styles would then print the proceedings title twice.
% NOTE(review): month/day give 2 July 2018, while the note field lists the
% conference dates as 28-30 November 2018 -- confirm which date is intended.
@inproceedings{771f81bbe5ae429383a500619b95c2cb,
  author    = {Khader, Mariam and Awajan, Arafat and Al-Naymat, Ghazi},
  title     = {The Effects of Natural Language Processing on Big Data Analysis: Sentiment Analysis Case Study},
  booktitle = {{ACIT} 2018 - 19th International Arab Conference on Information Technology},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2018},
  month     = jul,
  day       = {2},
  doi       = {10.1109/ACIT.2018.8672697},
  language  = {English},
  keywords  = {Big Data, Mahout, MapReduce Framework, Naive Bayes, Natural Language Processing, Sentiment Analysis},
  abstract  = {The social networks are one of the main sources of big data. Continuously, it produce huge volume of variety types of data at high velocity rates. This huge volume of data contains valuable information that requires efficient and scalable analysis techniques to be extracted. Hadoop/MapReduce is considered the most suitable framework for handling big data because of its scalability, reliability and simplicity. One of the basic applications to extract valuable information from data is the sentiment analysis. The sentiment analysis studies peoples' opinion by classifying their written text into positive or negative polarity. In this work, a sentiment analysis method for analyzing a Twitter data set is analyzed. The method uses the Naive Bayes algorithm for classifying the text into positive and negative polarity. Several linguistic and NLP preprocessing techniques were applied on the data set. The aim of these preprocessing techniques is to study their effects on the quality of big data classification. The applied preprocessing techniques have achieved an enhancement in the classification accuracy of the Naive Bayes algorithm. The experiments prove that the performance of the sentiment analysis is enhanced by 5\% using NLP and linguistic processing, yielding an accuracy of 73 \% on the used data set.},
  note      = {Publisher Copyright: {\textcopyright} 2018 IEEE.; 19th International Arab Conference on Information Technology, ACIT 2018 ; Conference date: 28-11-2018 Through 30-11-2018},
}