{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:56:45Z","timestamp":1781539005508,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":40,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T00:00:00Z","timestamp":1781481600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62577041"],"award-info":[{"award-number":["62577041"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Outstanding Youth Science Foundation of Shaanxi Province","award":["2025JC-JCQN-083"],"award-info":[{"award-number":["2025JC-JCQN-083"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62577041"],"award-info":[{"award-number":["62577041"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Natural Science Foundation of Xi'an","award":["2025JH-ZRKX-0540"],"award-info":[{"award-number":["2025JH-ZRKX-0540"]}]},{"name":"Key Research and Development Program of Shaanxi Province","award":["2025CY-YBXM-047"],"award-info":[{"award-number":["2025CY-YBXM-047"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62192730"],"award-info":[{"award-number":["62192730"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Natural Science Foundation of China","award":["62192734"],"award-info":[{"award-number":["62192734"]}]},{"name":"CCF-Huawei Populus Grove Fund","award":["CCF-Huawei Populus Grove Fund"],"award-info":[{"award-number":["CCF-Huawei Populus Grove Fund"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,6,16]]},"DOI":"10.1145\/3805622.3810801","type":"proceedings-article","created":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:42:57Z","timestamp":1781534577000},"page":"1803-1811","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["VideoAgent: Personalized Synthesis of Scientific Videos"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0382-2715","authenticated-orcid":false,"given":"Xiao","family":"Liang","sequence":"first","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0409-9194","authenticated-orcid":false,"given":"Bangxin","family":"Li","sequence":"additional","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-0770-566X","authenticated-orcid":false,"given":"Zixuan","family":"Chen","sequence":"additional","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-3538-432X","authenticated-orcid":false,"given":"Hanyue","family":"Zheng","sequence":"additional","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-2045-4822","authenticated-orcid":false,"given":"Zhi","family":"Ma","sequence":"additional","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8027-4287","authenticated-orcid":false,"given":"Di","family":"Wang","sequence":"additional","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5429-4580","authenticated-orcid":false,"given":"Cong","family":"Tian","sequence":"additional","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6913-8604","authenticated-orcid":false,"given":"Quan","family":"Wang","sequence":"additional","affiliation":[{"name":"Xidian University, Xian, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,6,15]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2501.06497"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2502.13923"},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2511.15253"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-acl.552"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2508.21720"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2507.06261"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2507.05595"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.5555\/3001460.3001507"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i1.19943"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-9996"},{"key":"e_1_3_3_1_12_2","volume-title":"Google NotebookLM","year":"2026","unstructured":"Google. 2026. Google NotebookLM. Retrieved April 20, 2026 from https:\/\/notebooklm.google\/"},{"key":"e_1_3_3_1_13_2","volume-title":"Gemini-2.5-Flash-Image (Nano Banana)","author":"DeepMind Google","year":"2025","unstructured":"Google DeepMind. 2025. Gemini-2.5-Flash-Image (Nano Banana). Google DeepMind, London, UK. https:\/\/deepmind.google\/models\/gemini-image\/ Model codenamed Nano Banana."},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2410.21276"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.acl-long.332"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2512.04529"},{"key":"e_1_3_3_1_17_2","first-page":"74","volume-title":"Text Summarization Branches Out","author":"Lin Chin-Yew","year":"2004","unstructured":"Chin-Yew Lin. 2004. ROUGE: A Package for Automatic Evaluation of Summaries. In Text Summarization Branches Out (Barcelona, Spain). Association for Computational Linguistics, Stroudsburg, PA, USA, 74\u201381. https:\/\/aclanthology.org\/W04-1013"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2501.17887"},{"key":"e_1_3_3_1_19_2","volume-title":"LunWenShuo","year":"2026","unstructured":"LunWenShuo. 2026. LunWenShuo. Retrieved April 20, 2026 from https:\/\/lunwenshuo.com\/"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"publisher","DOI":"10.1109\/ASE63991.2025.00104"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-emnlp.936"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2507.14306"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2505.21497"},{"key":"e_1_3_3_1_24_2","volume-title":"Marker: Convert PDF to markdown + JSON quickly with high accuracy","author":"Paruchuri Vik","year":"2023","unstructured":"Vik Paruchuri. 2023. Marker: Convert PDF to markdown + JSON quickly with high accuracy. Datalab. https:\/\/github.com\/VikParuchuri\/marker"},{"key":"e_1_3_3_1_25_2","volume-title":"AI-Powered Video Generator","year":"2026","unstructured":"Pictory. 2026. AI-Powered Video Generator. Retrieved April 20, 2026 from https:\/\/pictory.ai\/video-generator"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10000"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"publisher","DOI":"10.5555\/3618408.3619590"},{"key":"e_1_3_3_1_28_2","volume-title":"Language Models are Unsupervised Multitask Learners","author":"Radford Alec","year":"2019","unstructured":"Alec Radford, Jeff Wu, Rewon Child, David Luan, Dario Amodei, and Ilya Sutskever. 2019. Language Models are Unsupervised Multitask Learners. Technical Report. OpenAI, San Francisco, CA, USA. https:\/\/cdn.openai.com\/better-language-models\/language_models_are_unsupervised_multitask_learners.pdf"},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"publisher","unstructured":"Sara Salzmann Charlotte Walther and Kai Kaspar. 2025. A new dimension of simplified science communication: the easiness effect of science popularization in animated video abstracts. Frontiers in Psychology 16 Article 1584695 (2025). 10.3389\/fpsyg.2025.1584695","DOI":"10.3389\/fpsyg.2025.1584695"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2502.17540"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.emnlp-demos.58"},{"key":"e_1_3_3_1_32_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.111"},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2510.18234"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v40i48.42124"},{"key":"e_1_3_3_1_35_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i11.21738"},{"key":"e_1_3_3_1_36_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-emnlp.165"},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2509.11062"},{"key":"e_1_3_3_1_38_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v40i41.40758"},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2508.17188"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.emnlp-main.728"},{"key":"e_1_3_3_1_41_2","volume-title":"MoviePy: Video editing with Python","author":"Zulko Florian","year":"2015","unstructured":"Florian Zulko. 2015. MoviePy: Video editing with Python. https:\/\/github.com\/Zulko\/moviepy"}],"event":{"name":"ICMR '26: International Conference on Multimedia Retrieval","location":"Amsterdam The Netherlands","acronym":"ICMR '26","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 2026 International Conference on Multimedia Retrieval"],"original-title":[],"deposited":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:31:50Z","timestamp":1781537510000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3805622.3810801"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6,15]]},"references-count":40,"alternative-id":["10.1145\/3805622.3810801","10.1145\/3805622"],"URL":"https:\/\/doi.org\/10.1145\/3805622.3810801","relation":{},"subject":[],"published":{"date-parts":[[2026,6,15]]},"assertion":[{"value":"2026-06-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}