{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:41:26Z","timestamp":1755823286034,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":46,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,26]],"date-time":"2023-10-26T00:00:00Z","timestamp":1698278400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,26]]},"DOI":"10.1145\/3581783.3612573","type":"proceedings-article","created":{"date-parts":[[2023,10,27]],"date-time":"2023-10-27T07:26:54Z","timestamp":1698391614000},"page":"8114-8124","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["Handwritten Chemical Structure Image to Structure-Specific Markup Using Random Conditional Guided Decoder"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0001-3017-973X","authenticated-orcid":false,"given":"Jinshui","family":"Hu","sequence":"first","affiliation":[{"name":"University of Science and Technology of China, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-3041-7253","authenticated-orcid":false,"given":"Hao","family":"Wu","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-9329-6992","authenticated-orcid":false,"given":"Mingjun","family":"Chen","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-6682-2877","authenticated-orcid":false,"given":"Chenyu","family":"Liu","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0951-4281","authenticated-orcid":false,"given":"Jiajia","family":"Wu","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8114-2235","authenticated-orcid":false,"given":"Shi","family":"Yin","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4164-6647","authenticated-orcid":false,"given":"Baocai","family":"Yin","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4042-7522","authenticated-orcid":false,"given":"Bing","family":"Yin","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-0328-423X","authenticated-orcid":false,"given":"Cong","family":"Liu","sequence":"additional","affiliation":[{"name":"iFLYTEK Research, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2387-0389","authenticated-orcid":false,"given":"Jun","family":"Du","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0859-2827","authenticated-orcid":false,"given":"Lirong","family":"Dai","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2023,10,27]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i1.19885"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"e_1_3_2_1_3_1","unstructured":"Junyoung Chung Caglar Gulcehre Kyunghyun Cho and Yoshua Bengio. 2014. Empirical evaluation of gated recurrent neural networks on sequence modeling."},{"key":"e_1_3_2_1_4_1","volume-title":"Img2Mol-accurate SMILES recognition from molecular graphical depictions. Chemical science","author":"Clevert Djork-Arn\u00e9","year":"2021","unstructured":"Djork-Arn\u00e9 Clevert, Tuan Le, Robin Winter, and Floriane Montanari. 2021. Img2Mol-accurate SMILES recognition from molecular graphical depictions. Chemical science, Vol. 12, 42 (2021), 14174--14181."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Longfei Ding Mengbiao Zhao Fei Yin Shuiling Zeng and Cheng-Lin Liu. 2022. A Large-Scale Database for Chemical Structure Recognition and Preliminary Evaluation. In ICPR. 1464--1470.","DOI":"10.1109\/ICPR56361.2022.9956654"},{"key":"e_1_3_2_1_6_1","unstructured":"Alexey Dosovitskiy Lucas Beyer Alexander Kolesnikov Dirk Weissenborn Xiaohua Zhai Thomas Unterthiner Mostafa Dehghani Matthias Minderer Georg Heigold Sylvain Gelly et al. 2020. An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Anna Gaulton Anne Hersey Michal Nowotka A.Patr\u00edcia Bento Jon Chambers David Mendez Prudence Mutowo Francis Atkinson LouisaJ. Bellis Elena Cibrian-Uhalte and et al. 2017. The ChEMBL database in 2017. Nucleic Acids Research (Jan 2017).","DOI":"10.1093\/nar\/gkw1074"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3152247"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1186\/1758-2946-5-7"},{"volume-title":"Densely Connected Convolutional Networks. In 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR).","author":"Huang Gao","key":"e_1_3_2_1_10_1","unstructured":"Gao Huang, Zhuang Liu, Laurens Van Der Maaten, and Kilian Q. Weinberger. 2017. Densely Connected Convolutional Networks. In 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01761"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"crossref","unstructured":"Alexander Kirillov Eric Mintun Nikhila Ravi Hanzi Mao Chloe Rolland Laura Gustafson Tete Xiao Spencer Whitehead Alexander C Berg Wan-Yen Lo et al. 2023. Segment anything. arXiv preprint arXiv:2304.02643 (2023).","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Craig Knox Vivian Law Timothy Jewison Philip Liu Son Ly Alex Frolkis Allison Pon Kelly Banco Christine Mak Vanessa Neveu and et al. 2011. DrugBank 3.0: a comprehensive resource for ?Omics' research on drugs. Nucleic Acids Research (2011).","DOI":"10.1093\/nar\/gkq1126"},{"key":"e_1_3_2_1_14_1","first-page":"197","article-title":"When Counting Meets HMER: Counting-Aware Network for Handwritten Mathematical Expression Recognition","volume":"13688","author":"Li Bohan","year":"2022","unstructured":"Bohan Li, Ye Yuan, Dingkang Liang, Xiao Liu, Zhilong Ji, Jinfeng Bai, Wenyu Liu, and Xiang Bai. 2022a. When Counting Meets HMER: Counting-Aware Network for Handwritten Mathematical Expression Recognition. In ECCV, Vol. 13688. 197--214.","journal-title":"ECCV"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01325"},{"key":"e_1_3_2_1_16_1","volume-title":"PubChem as a public resource for drug discovery. Drug Discovery Today (Dec","author":"Li Qingliang","year":"2010","unstructured":"Qingliang Li, Tiejun Cheng, Yanli Wang, and StephenH. Bryant. 2010. PubChem as a public resource for drug discovery. Drug Discovery Today (Dec 2010)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01633"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00363"},{"key":"e_1_3_2_1_21_1","unstructured":"Eugenia Namiot. 2019. Using LaTeX for chemical formulas."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.0c00459"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.2c01480"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-020-00465-0"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.8b00669"},{"key":"e_1_3_2_1_26_1","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan N. Gomez Lukasz Kaiser and Illia Polosukhin. 2017. Attention is All you Need. In NeurIPS. 5998--6008."},{"key":"e_1_3_2_1_27_1","volume-title":"Conference on Robot Learning. PMLR, 1475--1485","author":"Wang Tai","year":"2022","unstructured":"Tai Wang, ZHU Xinge, Jiangmiao Pang, and Dahua Lin. 2022a. Probabilistic and geometric depth: Detecting objects in perspective. In Conference on Robot Learning. PMLR, 1475--1485."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00107"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01131"},{"key":"e_1_3_2_1_30_1","article-title":"SMILES, a chemical language and information system. 1. introduction to methodology and encoding rules","author":"Weininger David","year":"1988","unstructured":"David Weininger. 1988. SMILES, a chemical language and information system. 1. introduction to methodology and encoding rules. Journal of Chemical Information and Modeling (Feb 1988).","journal-title":"Journal of Chemical Information and Modeling"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1039\/C8SC04175J"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i3.20172"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"crossref","unstructured":"Jiajia Wu Jinshui Hu Mingjun Chen Lirong Dai Xuejing Niu and Ning Wang. 2022b. Structural String Decoder for Handwritten Mathematical Expression Recognition. In ICPR. 3246--3251.","DOI":"10.1109\/ICPR56361.2022.9956105"},{"key":"e_1_3_2_1_34_1","volume-title":"Handwritten Mathematical Expression Recognition via Paired Adversarial Learning. IJCV","author":"Wu Jin-Wen","year":"2020","unstructured":"Jin-Wen Wu, Fei Yin, Yan-Ming Zhang, Xu-Yao Zhang, and Cheng-Lin Liu. 2020. Handwritten Mathematical Expression Recognition via Paired Adversarial Learning. IJCV (2020)."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.2c00733"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01161"},{"key":"e_1_3_2_1_37_1","volume-title":"Object-Contextual Representations for Semantic Segmentation. arXiv preprint arXiv:1909.11065","author":"Yuan Yuhui","year":"2019","unstructured":"Yuhui Yuan, Xilin Chen, and Jingdong Wang. 2019. Object-Contextual Representations for Semantic Segmentation. arXiv preprint arXiv:1909.11065 (2019)."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"crossref","unstructured":"Ye Yuan Xiao Liu Wondimu Dikubab Hui Liu Zhilong Ji Zhongqin Wu and Xiang Bai. 2022a. Syntax-Aware Network for Handwritten Mathematical Expression Recognition. In CVPR. 4543--4552.","DOI":"10.1109\/CVPR52688.2022.00451"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00451"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-022-00557-6"},{"key":"e_1_3_2_1_41_1","volume-title":"International Conference on Machine Learning. PMLR, 11076--11085","author":"Zhang Jianshu","year":"2020","unstructured":"Jianshu Zhang, Jun Du, Yongxin Yang, Yi-Zhe Song, Si Wei, and Lirong Dai. 2020. A tree-structured decoder for image-to-markup generation. In International Conference on Machine Learning. PMLR, 11076--11085."},{"key":"e_1_3_2_1_42_1","volume-title":"attend and parse: An end-to-end neural network based approach to handwritten mathematical expression recognition. PR","author":"Zhang Jianshu","year":"2017","unstructured":"Jianshu Zhang, Jun Du, Shiliang Zhang, Dan Liu, Yulong Hu, Jinshui Hu, Si Wei, and Lirong Dai. 2017. Watch, attend and parse: An end-to-end neural network based approach to handwritten mathematical expression recognition. PR (2017)."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01641"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-86331-9_37"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548424"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00261"}],"event":{"name":"MM '23: The 31st ACM International Conference on Multimedia","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Ottawa ON Canada","acronym":"MM '23"},"container-title":["Proceedings of the 31st ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3581783.3612573","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3581783.3612573","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T23:59:08Z","timestamp":1755820748000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3581783.3612573"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,26]]},"references-count":46,"alternative-id":["10.1145\/3581783.3612573","10.1145\/3581783"],"URL":"https:\/\/doi.org\/10.1145\/3581783.3612573","relation":{},"subject":[],"published":{"date-parts":[[2023,10,26]]},"assertion":[{"value":"2023-10-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}