@article {10.3844/jcssp.2019.1355.1377, article_type = {journal}, title = {A CURE Algorithm for Vietnamese Sentiment Classification in a Parallel Environment}, author = {Phu, Vo Ngoc and Ngoc Tran, Vo Thi and Max, Jack}, volume = {15}, number = {10}, year = {2018}, month = {Apr}, pages = {1355-1377}, doi = {10.3844/jcssp.2019.1355.1377}, url = {https://thescipub.com/abstract/jcssp.2019.1355.1377}, abstract = {Solutions to process big data are imperative and beneficial for numerous fields of research and commercial applications. Thus, a new model has been proposed in this paper to be used for big data set sentiment classification in the Cloudera parallel network environment. Clustering Using Representatives (CURE), combined with Hadoop MAP (M) / REDUCE (R) in Cloudera – a parallel network system, was used for 20,000 documents in a Vietnamese testing data set. The testing data set included 10,000 positive Vietnamese documents and 10,000 negative ones. After testing our new model on the data set, a 62.92% accuracy rate of sentiment classification was achieved. Although our data set is small, this proposed model is able to process millions of Vietnamese documents, in addition to data in other languages, to shorten the execution time in the distributed environment}, journal = {Journal of Computer Science}, publisher = {Science Publications} }