
% Journal article: "Menu Text Recognition of Few-shot Learning" (Journal of New Media, 2022).
% REVIEW NOTE: the exported author list was comma-separated, which BibTeX cannot parse
% ("Too many commas in name"). It is rewritten below with " and " between people and
% each person in "Family, Given" form, assuming every comma-delimited segment of the
% export was one person written family-name-first.
% TODO(verify): the first author appeared in the export as the single token "Xiaoyu";
% the family name looks to have been dropped by the exporter. Confirm the full author
% list and name order against the publisher record for the DOI below.
@Article{jnm.2022.027890,
AUTHOR = {Xiaoyu and Tian, Zhenzhen and Xin, Zihao and Liu, Suolan and Chen, Fuhua and Wang, Hongyuan},
TITLE = {Menu Text Recognition of Few-shot Learning},
JOURNAL = {Journal of New Media},
VOLUME = {4},
YEAR = {2022},
NUMBER = {3},
PAGES = {137--143},
URL = {http://www.techscience.com/JNM/v4n3/48202},
ISSN = {2579-0129},
ABSTRACT = {Recent advances in OCR show that end-to-end (E2E) training pipelines including detection and identification can achieve the best results. However, many existing methods usually focus on case insensitive English characters. In this paper, we apply an E2E approach, the multiplex multilingual mask TextSpotter, which performs script recognition at the word level and uses different recognition headers to process different scripts while maintaining uniform loss, thus optimizing script recognition and multiple recognition headers simultaneously. Experiments show that this method is superior to the single-head model with similar number of parameters in end-to-end identification tasks.},
DOI = {10.32604/jnm.2022.027890}
}



