{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:25:18Z","timestamp":1750220718215,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":24,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,6,8]],"date-time":"2020-06-08T00:00:00Z","timestamp":1591574400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Academia Sinica, Taiwan","award":["AS-TP-107-M05"],"award-info":[{"award-number":["AS-TP-107-M05"]}]},{"DOI":"10.13039\/501100004663","name":"Ministry of Science and Technology, Taiwan","doi-asserted-by":"publisher","award":["MOST-106-2923-E-002-012-MY3, MOST-109-2634-F-002-040-, MOST-109-2634-F-002-034-, MOST-108-2218-E-009-051-"],"award-info":[{"award-number":["MOST-106-2923-E-002-012-MY3, MOST-109-2634-F-002-040-, MOST-109-2634-F-002-034-, MOST-108-2218-E-009-051-"]}],"id":[{"id":"10.13039\/501100004663","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,6,8]]},"DOI":"10.1145\/3372278.3390735","type":"proceedings-article","created":{"date-parts":[[2020,6,2]],"date-time":"2020-06-02T04:35:27Z","timestamp":1591072527000},"page":"326-330","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Visual Story Ordering with a Bidirectional Writer"],"prefix":"10.1145","author":[{"given":"Wei-Rou","family":"Lin","sequence":"first","affiliation":[{"name":"National Taiwan University, Taipei City, Taiwan Roc"}]},{"given":"Hen-Hsen","family":"Huang","sequence":"additional","affiliation":[{"name":"National Chengchi University &amp; MOST Joint Research Center for AI Technology and All Vista Healthcare, Taipei City, Taiwan Roc"}]},{"given":"Hsin-Hsi","family":"Chen","sequence":"additional","affiliation":[{"name":"National Chengchi University &amp; MOST Joint Research Center for AI Technology and All Vista Healthcare, Taipei City, Taiwan Roc"}]}],"member":"320","published-online":{"date-parts":[[2020,6,8]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D16-1091"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1613\/jair.991"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1162\/coli.2008.34.1.1"},{"key":"e_1_3_2_1_4_1","first-page":"1","article-title":"A Bottom-up Approach to Sentence Ordering for Multi-document","volume":"46","author":"Bollegala Danushka","year":"2010","unstructured":"Danushka Bollegala , Naoaki Okazaki , and Mitsuru Ishizuka . 2010 . A Bottom-up Approach to Sentence Ordering for Multi-document Summarization. Inf. Process.Manage. 46 , 1 (Jan. 2010), 89--109. https:\/\/doi.org\/10.1016\/j.ipm.2009.07.004 10.1016\/j.ipm.2009.07.004 Danushka Bollegala, Naoaki Okazaki, and Mitsuru Ishizuka. 2010. A Bottom-up Approach to Sentence Ordering for Multi-document Summarization. Inf. Process.Manage.46, 1 (Jan. 2010), 89--109. https:\/\/doi.org\/10.1016\/j.ipm.2009.07.004","journal-title":"Summarization. Inf. Process.Manage."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1177\/073428299601400305"},{"key":"e_1_3_2_1_6_1","unstructured":"Patricia Chisholm. 1970. The Structure of Intellect Theory: Implications for More Meaningful Mental Test Interpretations. (1970).  Patricia Chisholm. 1970. The Structure of Intellect Theory: Implications for More Meaningful Mental Test Interpretations. (1970)."},{"key":"e_1_3_2_1_7_1","unstructured":"Andrea Frome Greg S Corrado Jon Shlens Samy Bengio Jeff Dean Marc'Aurelio Ranzato and Tomas Mikolov. [n.d.]. DeViSE: A Deep Visual-Semantic Embedding Model. In Advances in Neural Information Processing Systems 26.  Andrea Frome Greg S Corrado Jon Shlens Samy Bengio Jeff Dean Marc'Aurelio Ranzato and Tomas Mikolov. [n.d.]. DeViSE: A Deep Visual-Semantic Embedding Model. In Advances in Neural Information Processing Systems 26."},{"key":"e_1_3_2_1_8_1","volume-title":"Proceedings of the 27th International Conference on Neural Information Processing Systems -","volume":"2","author":"Goodfellow Ian J.","year":"2014","unstructured":"Ian J. Goodfellow , Jean Pouget-Abadie , Mehdi Mirza , Bing Xu , David Warde-Farley , Sherjil Ozair , Aaron Courville , and Yoshua Bengio . 2014 . Generative Adversarial Nets . In Proceedings of the 27th International Conference on Neural Information Processing Systems - Volume 2 (NIPS'14). MIT Press, Cambridge, MA,USA, 2672--2680. http:\/\/dl.acm.org\/citation.cfm?id=2969033.2969125 Ian J. Goodfellow, Jean Pouget-Abadie, Mehdi Mirza, Bing Xu, David Warde-Farley, Sherjil Ozair, Aaron Courville, and Yoshua Bengio. 2014. Generative Adversarial Nets. In Proceedings of the 27th International Conference on Neural Information Processing Systems - Volume 2 (NIPS'14). MIT Press, Cambridge, MA,USA, 2672--2680. http:\/\/dl.acm.org\/citation.cfm?id=2969033.2969125"},{"key":"e_1_3_2_1_9_1","volume-title":"Deep Residual Learning for Image Recognition. In2016 IEEE Conference on Computer Vision and Pattern Recognition(CVPR). 770--778","author":"He K.","year":"2016","unstructured":"K. He , X. Zhang , S. Ren , and J. Sun . 2016 . Deep Residual Learning for Image Recognition. In2016 IEEE Conference on Computer Vision and Pattern Recognition(CVPR). 770--778 . https:\/\/doi.org\/10.1109\/CVPR. 2016 .90 10.1109\/CVPR.2016.90 K. He, X. Zhang, S. Ren, and J. Sun. 2016. Deep Residual Learning for Image Recognition. In2016 IEEE Conference on Computer Vision and Pattern Recognition(CVPR). 770--778. https:\/\/doi.org\/10.1109\/CVPR.2016.90"},{"volume-title":"Proceedings of the 2016 Conference of the North American","author":"Huang Ting-Hao","key":"e_1_3_2_1_10_1","unstructured":"Ting-Hao (Kenneth) Huang , Francis Ferraro , Nasrin Mostafazadeh , Ishan Misra , Aishwarya Agrawal , Jacob Devlin , Ross Girshick , Xiaodong He , Pushmeet Kohli , Dhruv Batra , C. Lawrence Zitnick , Devi Parikh , Lucy Vanderwende , Michel Galley , and Margaret Mitchell . 2016. Visual Storytelling . In Proceedings of the 2016 Conference of the North American Chapter of the Association for Computational Linguistics:Human Language Technologies. Association for Computational Linguistics , San Diego , California, 1233--1239. http:\/\/www.aclweb.org\/anthology\/N16--1147 Ting-Hao (Kenneth) Huang, Francis Ferraro, Nasrin Mostafazadeh, Ishan Misra, Aishwarya Agrawal, Jacob Devlin, Ross Girshick, Xiaodong He, Pushmeet Kohli, Dhruv Batra, C. Lawrence Zitnick, Devi Parikh, Lucy Vanderwende, Michel Galley, and Margaret Mitchell. 2016. Visual Storytelling. In Proceedings of the 2016 Conference of the North American Chapter of the Association for Computational Linguistics:Human Language Technologies. Association for Computational Linguistics, San Diego, California, 1233--1239. http:\/\/www.aclweb.org\/anthology\/N16--1147"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2598339"},{"key":"e_1_3_2_1_12_1","volume-title":"Proceedings of the 31st International Conference on Machine Learning. 595--603","author":"Kiros Ryan","year":"2014","unstructured":"Ryan Kiros , Ruslan Salakhutdinov , and Rich Zemel . 2014 . Multimodal Neural Language Models . In Proceedings of the 31st International Conference on Machine Learning. 595--603 . Ryan Kiros, Ruslan Salakhutdinov, and Rich Zemel. 2014. Multimodal Neural Language Models. In Proceedings of the 31st International Conference on Machine Learning. 595--603."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.3115\/1075096.1075165"},{"key":"e_1_3_2_1_14_1","unstructured":"Karen Le. 2015. Narrative and Horticultural Imperative: Predicting Discourse Ability in Traumatic Brain Injury from Cognitive and Communicative Factors.(2015).  Karen Le. 2015. Narrative and Horticultural Imperative: Predicting Discourse Ability in Traumatic Brain Injury from Cognitive and Communicative Factors.(2015)."},{"volume-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 4681--4690","author":"Ledig Christian","key":"e_1_3_2_1_15_1","unstructured":"Christian Ledig , Lucas Theis , Ferenc Huszar , Jose Caballero , Andrew Cunning-ham, Alejandro Acosta , Andrew Aitken , Alykhan Tejani , Johannes Totz , Zehan Wang , Photo-Realistic Single Image Super-Resolution Using a Generative Adversarial Network . In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 4681--4690 . Christian Ledig, Lucas Theis, Ferenc Huszar, Jose Caballero, Andrew Cunning-ham, Alejandro Acosta, Andrew Aitken, Alykhan Tejani, Johannes Totz, Zehan Wang, et al.2017. Photo-Realistic Single Image Super-Resolution Using a Generative Adversarial Network. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 4681--4690."},{"key":"e_1_3_2_1_16_1","volume-title":"Mo Yu, Bing Xiang, Bowen Zhou, and Yoshua Bengio.","author":"Lin Zhouhan","year":"2017","unstructured":"Zhouhan Lin , Minwei Feng , Cicero Nogueira dos Santos , Mo Yu, Bing Xiang, Bowen Zhou, and Yoshua Bengio. 2017 . A structured self-attentive sentence embedding. arXiv preprint arXiv:1703.03130(2017). Zhouhan Lin, Minwei Feng, Cicero Nogueira dos Santos, Mo Yu, Bing Xiang, Bowen Zhou, and Yoshua Bengio. 2017. A structured self-attentive sentence embedding. arXiv preprint arXiv:1703.03130(2017)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"crossref","unstructured":"Lajanugen Logeswaran Honglak Lee and Dragomir Radev. 2018. Sentence Ordering and Coherence Modeling using Recurrent Neural Networks. https:\/\/www.aaai.org\/ocs\/index.php\/AAAI\/AAAI18\/paper\/view\/17011  Lajanugen Logeswaran Honglak Lee and Dragomir Radev. 2018. Sentence Ordering and Coherence Modeling using Recurrent Neural Networks. https:\/\/www.aaai.org\/ocs\/index.php\/AAAI\/AAAI18\/paper\/view\/17011","DOI":"10.1609\/aaai.v32i1.11997"},{"key":"e_1_3_2_1_18_1","volume-title":"Proceedings of the32Nd International Conference on International Conference on Machine Learning-","volume":"37","author":"Srivastava Nitish","year":"2015","unstructured":"Nitish Srivastava , Elman Mansimov , and Ruslan Salakhutdinov . 2015 . Unsupervised Learning of Video Representations Using LSTMs . In Proceedings of the32Nd International Conference on International Conference on Machine Learning- Volume 37 (ICML'15). JMLR.org, 843--852. http:\/\/dl.acm.org\/citation.cfm?id=3045118.3045209 Nitish Srivastava, Elman Mansimov, and Ruslan Salakhutdinov. 2015. Unsupervised Learning of Video Representations Using LSTMs. In Proceedings of the32Nd International Conference on International Conference on Machine Learning- Volume 37 (ICML'15). JMLR.org, 843--852. http:\/\/dl.acm.org\/citation.cfm?id=3045118.3045209"},{"key":"e_1_3_2_1_19_1","volume-title":"Bidirectional Beam Search: Forward-Backward Inference in Neural Sequence Models for Fill-In-The-Blank Image Captioning. In The IEEE Conference on Computer Vision and Pattern Recognition(CVPR).","author":"Sun Qing","year":"2017","unstructured":"Qing Sun , Stefan Lee , and Dhruv Batra . 2017 . Bidirectional Beam Search: Forward-Backward Inference in Neural Sequence Models for Fill-In-The-Blank Image Captioning. In The IEEE Conference on Computer Vision and Pattern Recognition(CVPR). Qing Sun, Stefan Lee, and Dhruv Batra. 2017. Bidirectional Beam Search: Forward-Backward Inference in Neural Sequence Models for Fill-In-The-Blank Image Captioning. In The IEEE Conference on Computer Vision and Pattern Recognition(CVPR)."},{"key":"e_1_3_2_1_20_1","unstructured":"Oriol Vinyals Samy Bengio and Manjunath Kudlur. 2015. Order matters: Sequence to sequence for sets.arXiv preprint arXiv:1511.06391(2015).  Oriol Vinyals Samy Bengio and Manjunath Kudlur. 2015. Order matters: Sequence to sequence for sets.arXiv preprint arXiv:1511.06391(2015)."},{"key":"e_1_3_2_1_21_1","unstructured":"Oriol Vinyals Meire Fortunato and Navdeep Jaitly. [n.d.]. Pointer Networks. In Advances in Neural Information Processing Systems 28.  Oriol Vinyals Meire Fortunato and Navdeep Jaitly. [n.d.]. Pointer Networks. In Advances in Neural Information Processing Systems 28."},{"key":"e_1_3_2_1_22_1","volume-title":"Wsabie: Scaling Up to Large Vocabulary Image Annotation. https:\/\/www.aaai.org\/ocs\/index.php\/IJCAI\/IJCAI11\/paper\/view\/2926","author":"Weston Jason","year":"2011","unstructured":"Jason Weston , Samy Bengio , and Nicolas Usunier . 2011 . Wsabie: Scaling Up to Large Vocabulary Image Annotation. https:\/\/www.aaai.org\/ocs\/index.php\/IJCAI\/IJCAI11\/paper\/view\/2926 Jason Weston, Samy Bengio, and Nicolas Usunier. 2011. Wsabie: Scaling Up to Large Vocabulary Image Annotation. https:\/\/www.aaai.org\/ocs\/index.php\/IJCAI\/IJCAI11\/paper\/view\/2926"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.326"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2893499"}],"event":{"name":"ICMR '20: International Conference on Multimedia Retrieval","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Dublin Ireland","acronym":"ICMR '20"},"container-title":["Proceedings of the 2020 International Conference on Multimedia Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3372278.3390735","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3372278.3390735","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T22:33:25Z","timestamp":1750199605000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3372278.3390735"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,6,8]]},"references-count":24,"alternative-id":["10.1145\/3372278.3390735","10.1145\/3372278"],"URL":"https:\/\/doi.org\/10.1145\/3372278.3390735","relation":{},"subject":[],"published":{"date-parts":[[2020,6,8]]},"assertion":[{"value":"2020-06-08","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}