@Article{cmes.2022.020128,
AUTHOR = {Bao Rong Chang, Hsiu-Fen Tsai, Yu-Chieh Lin},
TITLE = {Optimizing Big Data Retrieval and Job Scheduling Using Deep Learning Approaches},
JOURNAL = {Computer Modeling in Engineering \& Sciences},
VOLUME = {134},
YEAR = {2023},
NUMBER = {2},
PAGES = {783--815},
URL = {http://www.techscience.com/CMES/v134n2/49504},
ISSN = {1526-1506},
ABSTRACT = {Big data analytics in business intelligence do not provide effective data retrieval methods and job scheduling that
will cause execution inefficiency and low system throughput. This paper aims to enhance the capability of data
retrieval and job scheduling to speed up the operation of big data analytics to overcome inefficiency and low
throughput problems. First, integrating stacked sparse autoencoder and Elasticsearch indexing explored fast data
searching and distributed indexing, which reduces the search scope of the database and dramatically speeds up
data searching. Next, exploiting a deep neural network to predict the approximate execution time of a job gives
prioritized job scheduling based on the shortest job first, which reduces the average waiting time of job execution.
As a result, the proposed data retrieval approach outperforms the previous method using a deep autoencoder and
Solr indexing, significantly improving the speed of data retrieval up to 53% and increasing system throughput by
53%. On the other hand, the proposed job scheduling algorithm defeats both first-in-first-out and memory-sensitive
heterogeneous early finish time scheduling algorithms, effectively shortening the average waiting time up to 5% and
average weighted turnaround time by 19%, respectively.},
DOI = {10.32604/cmes.2022.020128}
}