
% Wang et al. (2020): review of data cleaning methods for Web information
% systems, published in Computers, Materials and Continua, vol. 62, no. 3.
% Authors are stored in "Last, First" form and joined with " and " so that
% BibTeX parses five separate names; the ampersand in the abstract is escaped
% so the field is safe under styles that typeset it.
@article{cmc.2020.08675,
  author   = {Wang, Jinlin and Wang, Xing and Yang, Yuchen and Zhang, Hongli and Fang, Binxing},
  title    = {A Review of Data Cleaning Methods for Web Information System},
  journal  = {Computers, Materials \& Continua},
  volume   = {62},
  number   = {3},
  pages    = {1053--1075},
  year     = {2020},
  issn     = {1546-2226},
  doi      = {10.32604/cmc.2020.08675},
  url      = {http://www.techscience.com/cmc/v62n3/38341},
  abstract = {Web information system (WIS) is frequently-used and indispensable in daily
social life. WIS provides information services in many scenarios, such as electronic
commerce, communities, and edutainment. Data cleaning plays an essential role in
various WIS scenarios to improve the quality of data service. In this paper, we present a
review of the state-of-the-art methods for data cleaning in WIS. According to the
characteristics of data cleaning, we extract the critical elements of WIS, such as
interactive objects, application scenarios, and core technology, to classify the existing
works. Then, after elaborating and analyzing each category, we summarize the
descriptions and challenges of data cleaning methods with sub-elements such as data \&
user interaction, data quality rule, model, crowdsourcing, and privacy preservation.
Finally, we analyze various types of problems and provide suggestions for future research
on data cleaning in WIS from the technology and interactive perspective.},
}



