
% Journal article: RUSAS (Roman Urdu Sentiment Analysis System), Computers, Materials and Continua 79(1), 2024.
@Article{cmc.2024.047466,
AUTHOR = {Jawad, Kazim and Ahmad, Muhammad and Alvi, Majdah and Alvi, Muhammad Bux},
TITLE = {{RUSAS}: {Roman} {Urdu} Sentiment Analysis System},
JOURNAL = {Computers, Materials \& Continua},
VOLUME = {79},
YEAR = {2024},
NUMBER = {1},
PAGES = {1463--1480},
URL = {http://www.techscience.com/cmc/v79n1/56272},
ISSN = {1546-2226},
ABSTRACT = {Sentiment analysis, the meta field of Natural Language Processing (NLP), attempts to analyze and identify the sentiments in the opinionated text data. People share their judgments, reactions, and feedback on the internet using various languages. Urdu is one of them, and it is frequently used worldwide. Urdu-speaking people prefer to communicate on social media in Roman Urdu (RU), an English scripting style with the Urdu language dialect. Researchers have developed versatile lexical resources for features-rich comprehensive languages, but limited linguistic resources are available to facilitate the sentiment classification of Roman Urdu. This effort encompasses extracting subjective expressions in Roman Urdu and determining the implied opinionated text polarity. The primary sources of the dataset are Daraz (an e-commerce platform), Google Maps, and the manual effort. The contributions of this study include a Bilingual Roman Urdu Language Detector (BRULD) and a Roman Urdu Spelling Checker (RUSC). These integrated modules accept the user input, detect the text language, correct the spellings, categorize the sentiments, and return the input sentence's orientation with a sentiment intensity score. The developed system gains strength with each input experience gradually. The results show that the language detector gives an accuracy of 97.1\% on a close domain dataset, with an overall sentiment classification accuracy of 94.3\%.},
DOI = {10.32604/cmc.2024.047466}
}



