@Article{cmc.2020.06478, AUTHOR = {Dongjie Zhu, Haiwen Du, Yundong Sun, Xiaofang Li, Rongning Qu, Hao Hu, Shuangshuang Dong, Helen Min Zhou, Ning Cao,}, TITLE = {Massive Files Prefetching Model Based on LSTM Neural Network with Cache Transaction Strategy}, JOURNAL = {Computers, Materials \& Continua}, VOLUME = {63}, YEAR = {2020}, NUMBER = {2}, PAGES = {979--993}, URL = {http://www.techscience.com/cmc/v63n2/38555}, ISSN = {1546-2226}, ABSTRACT = {In distributed storage systems, file access efficiency has an important impact on the real-time nature of information forensics. As a popular approach to improve file accessing efficiency, prefetching model can fetches data before it is needed according to the file access pattern, which can reduce the I/O waiting time and increase the system concurrency. However, prefetching model needs to mine the degree of association between files to ensure the accuracy of prefetching. In the massive small file situation, the sheer volume of files poses a challenge to the efficiency and accuracy of relevance mining. In this paper, we propose a massive files prefetching model based on LSTM neural network with cache transaction strategy to improve file access efficiency. Firstly, we propose a file clustering algorithm based on temporal locality and spatial locality to reduce the computational complexity. Secondly, we propose a definition of cache transaction according to files occurrence in cache instead of time-offset distance based methods to extract file block feature accurately. Lastly, we innovatively propose a file access prediction algorithm based on LSTM neural network which predict the file that have high possibility to be accessed. Experiments show that compared with the traditional LRU and the plain grouping methods, the proposed model notably increase the cache hit rate and effectively reduces the I/O wait time.}, DOI = {10.32604/cmc.2020.06478} }