{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,1,26]],"date-time":"2024-01-26T00:08:17Z","timestamp":1706227697122},"reference-count":56,"publisher":"SPIE-Intl Soc Optical Eng","issue":"02","funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62105196"],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["J. Electron. Imag."],"published-print":{"date-parts":[[2023,3,19]]},"DOI":"10.1117\/1.jei.32.2.023015","type":"journal-article","created":{"date-parts":[[2023,3,19]],"date-time":"2023-03-19T16:30:15Z","timestamp":1679243415000},"source":"Crossref","is-referenced-by-count":0,"title":["Multilingual semantic fusion network for text recognition in the wild"],"prefix":"10.1117","volume":"32","author":[{"given":"Celi","family":"Lou","sequence":"first","affiliation":[{"name":"Shanghai University of Electric Power, College of Electronics and Information Engineering, Shanghai, China"}]},{"given":"Minglei","family":"Tong","sequence":"additional","affiliation":[{"name":"Shanghai University of Electric Power, College of Electronics and Information Engineering, Shanghai, China"}]},{"given":"Liang","family":"Xue","sequence":"additional","affiliation":[{"name":"Shanghai University of Electric Power, College of Electronics and Information Engineering, Shanghai, China"}]},{"given":"Sisil","family":"Kumarawadu","sequence":"additional","affiliation":[{"name":"University of Moratuwa, Department of Electrical Engineering, Moratuwa, Sri Lanka"}]}],"member":"189","reference":[{"key":"r1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2019.00102"},{"key":"r2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00295"},{"key":"r3","doi-asserted-by":"publisher","DOI":"10.1145\/3440756"},{"key":"r4","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2020.03.001"},{"key":"r5","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-020-09862-x"},{"key":"r6","doi-asserted-by":"publisher","DOI":"10.1007\/s11220-021-00356-0"},{"key":"r7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58598-3_40"},{"key":"r8","first-page":"3163","article-title":"R3Det: refined single-stage detector with feature refinement for rotating object","author":"Yang","year":"2021"},{"key":"r9","doi-asserted-by":"publisher","DOI":"10.1117\/1.JEI.27.3.033032"},{"key":"r10","doi-asserted-by":"publisher","DOI":"10.1117\/12.2604527"},{"key":"r11","doi-asserted-by":"publisher","DOI":"10.1117\/1.JEI.31.4.043051"},{"key":"r12","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2022.01.185"},{"key":"r13","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v30i1.10465","article-title":"Reading scene text in deep convolutional sequences","author":"He","year":"2016"},{"key":"r14","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2646371"},{"key":"r15","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2020.07.027"},{"key":"r16","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2848939"},{"key":"r17","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107692"},{"key":"r18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00730"},{"key":"r19","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"r20","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.07.010"},{"key":"r21","article-title":"2D attentional irregular scene text recognizer","author":"Lyu","year":"2019"},{"key":"r22","doi-asserted-by":"crossref","DOI":"10.1109\/ICDAR.2019.00130","article-title":"NRTR: a no-recurrence sequence-to-sequence model for scene text recognition","author":"Sheng","year":"2019"},{"key":"r23","article-title":"An image is worth 16 \u00d7 16 words: transformers for image recognition at scale","author":"Dosovitskiy","year":"2021"},{"key":"r24","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2021.07.016"},{"key":"r25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01213"},{"key":"r26","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01467"},{"key":"r27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00702"},{"key":"r28","article-title":"Cross-lingual language model pretraining","author":"Conneau","year":"2019"},{"key":"r29","doi-asserted-by":"crossref","DOI":"10.1145\/1143844.1143891","article-title":"Connectionist temporal classification: labelling unsegmented sequence data with recurrent neural networks","author":"Graves","year":"2006"},{"key":"r30","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.543"},{"key":"r31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.452"},{"key":"r32","article-title":"Bert: pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018"},{"key":"r33","article-title":"Attention is all you need","author":"Vaswani","year":"2017"},{"key":"r34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW50498.2020.00281"},{"key":"r35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-86549-8_21"},{"key":"r36","article-title":"TrOCR: transformer-based optical character recognition with pre-trained models","author":"Li","year":"2021"},{"key":"r37","article-title":"Toward multilingual neural machine translation with universal encoder and decoder","author":"Ha","year":"2016"},{"key":"r38","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00065"},{"key":"r39","article-title":"Synthetic data and artificial neural networks for natural scene text recognition","author":"Jaderberg","year":"2014"},{"key":"r40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.254"},{"key":"r41","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-86337-1_8"},{"key":"r42","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-86337-1_40"},{"key":"r43","doi-asserted-by":"publisher","DOI":"10.5244\/C.26.127"},{"key":"r44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126402"},{"key":"r45","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2013.221"},{"key":"r46","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2015.7333942"},{"key":"r47","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.76"},{"key":"r48","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2014.07.008"},{"key":"r49","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58529-7_9"},{"key":"r50","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2020.06.009"},{"key":"r51","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR48806.2021.9412037"},{"key":"r52","doi-asserted-by":"crossref","DOI":"10.1145\/3474085.3475238","article-title":"PIMNet: a parallel, iterative and mimicking network for scene text recognition","author":"Qiao","year":"2021"},{"key":"r53","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01393"},{"key":"r54","doi-asserted-by":"publisher","DOI":"10.1155\/2022\/2996862"},{"key":"r55","doi-asserted-by":"publisher","DOI":"10.1007\/s10032-022-00398-4"},{"key":"r56","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-022-04241-5"}],"container-title":["Journal of Electronic Imaging"],"original-title":[],"link":[{"URL":"https:\/\/www.spiedigitallibrary.org\/journalArticle\/Download?urlId=10.1117%2f1.JEI.32.2.023015","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,25]],"date-time":"2024-01-25T20:03:02Z","timestamp":1706212982000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.spiedigitallibrary.org\/journals\/journal-of-electronic-imaging\/volume-32\/issue-02\/023015\/Multilingual-semantic-fusion-network-for-text-recognition-in-the-wild\/10.1117\/1.JEI.32.2.023015.full"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,3,19]]},"references-count":56,"journal-issue":{"issue":"02","published-online":{"date-parts":[[2023,3,1]]}},"URL":"https:\/\/doi.org\/10.1117\/1.jei.32.2.023015","relation":{},"ISSN":["1017-9909"],"issn-type":[{"value":"1017-9909","type":"print"}],"subject":[],"published":{"date-parts":[[2023,3,19]]}}}