{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,11]],"date-time":"2026-04-11T21:03:42Z","timestamp":1775941422402,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":43,"publisher":"ACM","funder":[{"name":"JSPS KAKENHI Grant","award":["24K02962"],"award-info":[{"award-number":["24K02962"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,3,16]]},"DOI":"10.1145\/3745900.3746066","type":"proceedings-article","created":{"date-parts":[[2025,10,9]],"date-time":"2025-10-09T11:36:08Z","timestamp":1760009768000},"page":"289-301","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["GenAIReading: Augmenting Human Cognition with Interactive Digital Textbooks Using Large Language Models and Image Generation Models"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-6324-9291","authenticated-orcid":false,"given":"Ryugo","family":"Morita","sequence":"first","affiliation":[{"name":"Hosei University\/DFKI GmbH, Tokyo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2031-9142","authenticated-orcid":false,"given":"Ko","family":"Watanabe","sequence":"additional","affiliation":[{"name":"DFKI GmbH, Kaiserslautern, Germany"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5078-0522","authenticated-orcid":false,"given":"Jinjia","family":"Zhou","sequence":"additional","affiliation":[{"name":"Hosei University, Tokyo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6100-8255","authenticated-orcid":false,"given":"Andreas","family":"Dengel","sequence":"additional","affiliation":[{"name":"DFKI GmbH, Kaiserslautern, Germany"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5374-1510","authenticated-orcid":false,"given":"Shoya","family":"Ishimaru","sequence":"additional","affiliation":[{"name":"Osaka Metropolitan University, Osaka, Japan"}]}],"member":"320","published-online":{"date-parts":[[2025,10,9]]},"reference":[{"key":"e_1_3_3_2_2_2","doi-asserted-by":"crossref","unstructured":"Farhan Ali Doris Choy Shanti Divaharan Hui\u00a0Yong Tay and Wenli Chen. 2023. Supporting self-directed learning and self-assessment using TeacherGAIA a generative AI chatbot application: Learning approaches and prompt engineering. Learning: Research and Practice 9 2 (2023) 135\u2013147.","DOI":"10.1080\/23735082.2023.2258886"},{"key":"e_1_3_3_2_3_2","doi-asserted-by":"crossref","unstructured":"Richard\u00a0C Atkinson. 1968. Human memory: A proposed system and its control processes. The Psychology of Learning and Motivation 2 (1968).","DOI":"10.1016\/S0079-7421(08)60422-3"},{"key":"e_1_3_3_2_4_2","doi-asserted-by":"publisher","DOI":"10.1145\/1358628.1358796"},{"key":"e_1_3_3_2_5_2","doi-asserted-by":"crossref","unstructured":"Russell\u00a0N. Carney and Joel\u00a0R. Levin. 2002. Pictorial illustrations still improve students\u2019 learning from text. Educational Psychology Review 14 1 (2002) 5\u201326.","DOI":"10.1023\/A:1013176309260"},{"key":"e_1_3_3_2_6_2","doi-asserted-by":"crossref","unstructured":"Sarah Clinch and Jamie\u00a0A Ward. 2023. Augmented Cognition. IEEE Pervasive Computing 22 3 (2023) 6\u20137.","DOI":"10.1109\/MPRV.2023.3296010"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"crossref","unstructured":"Fergus I.\u00a0M. Craik and Robert\u00a0S. Lockhart. 1972. Levels of processing: A framework for memory research. Journal of Verbal Learning and Verbal Behavior 11 6 (1972) 671\u2013684.","DOI":"10.1016\/S0022-5371(72)80001-X"},{"key":"e_1_3_3_2_8_2","doi-asserted-by":"publisher","DOI":"10.1145\/3519391.3524169"},{"key":"e_1_3_3_2_9_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3651118"},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642129"},{"key":"e_1_3_3_2_11_2","unstructured":"Soheil Feizi MohammadTaghi Hajiaghayi Keivan Rezaei and Suho Shin. 2023. Online Advertisements with LLMs: Opportunities and Challenges. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2311.07601 (2023)."},{"key":"e_1_3_3_2_12_2","doi-asserted-by":"publisher","DOI":"10.1145\/3638067.3638100"},{"key":"e_1_3_3_2_13_2","doi-asserted-by":"publisher","DOI":"10.1145\/3639701.3656303"},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"crossref","unstructured":"Jack Hessel Ari Holtzman Maxwell Forbes Ronan\u00a0Le Bras and Yejin Choi. 2021. Clipscore: A reference-free evaluation metric for image captioning. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2104.08718 (2021).","DOI":"10.18653\/v1\/2021.emnlp-main.595"},{"key":"e_1_3_3_2_15_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642224"},{"key":"e_1_3_3_2_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3267305.3267667"},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"crossref","unstructured":"Andy\u00a0J King Nadine Bol R\u00a0Glenn Cummins and Kevin\u00a0K John. 2019. Improving visual behavior research in communication science: An overview review and reporting recommendations for using eye-tracking methods. Communication Methods and Measures 13 3 (2019) 149\u2013177.","DOI":"10.1080\/19312458.2018.1558194"},{"key":"e_1_3_3_2_18_2","doi-asserted-by":"publisher","DOI":"10.1002\/9780470757642.ch12"},{"key":"e_1_3_3_2_19_2","unstructured":"Kai Kunze Pattie Maes FlorianFloyd\u2019 Mueller and Katrin Wolf. 2023. Cognitive Augmentation (Dagstuhl Seminar 22491). (2023)."},{"key":"e_1_3_3_2_20_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3501825"},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1145\/3573051.3593393"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"crossref","unstructured":"Richard\u00a0E. Mayer and Roxana Moreno. 2003. Nine ways to reduce cognitive load in multimedia learning. Educational Psychologist 38 1 (2003) 43\u201352.","DOI":"10.1207\/S15326985EP3801_6"},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"crossref","unstructured":"Douglas\u00a0L. Nelson Valorie\u00a0S. Reed and John\u00a0R. Walling. 1976. Picture superiority effect. Journal of Experimental Psychology: Human Learning and Memory 2 5 (1976) 523\u2013528.","DOI":"10.1037\/\/0278-7393.2.5.523"},{"key":"e_1_3_3_2_24_2","unstructured":"Long Ouyang Jeffrey Wu Xu Jiang Diogo Almeida Carroll Wainwright Pamela Mishkin Chong Zhang Sandhini Agarwal Katarina Slama Alex Ray et\u00a0al. 2022. Training language models to follow instructions with human feedback. Advances in neural information processing systems 35 (2022) 27730\u201327744."},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"crossref","unstructured":"Allan Paivio. 1991. Dual coding theory: Retrospect and current status. Canadian Journal of Psychology 45 3 (1991) 255\u2013287.","DOI":"10.1037\/h0084295"},{"key":"e_1_3_3_2_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642785"},{"key":"e_1_3_3_2_27_2","doi-asserted-by":"publisher","DOI":"10.1145\/3643834.3661613"},{"key":"e_1_3_3_2_28_2","first-page":"8748","volume-title":"International conference on machine learning","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong\u00a0Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et\u00a0al. 2021. Learning transferable visual models from natural language supervision. In International conference on machine learning. PMLR, 8748\u20138763."},{"key":"e_1_3_3_2_29_2","first-page":"8821","volume-title":"International conference on machine learning","author":"Ramesh Aditya","year":"2021","unstructured":"Aditya Ramesh, Mikhail Pavlov, Gabriel Goh, Scott Gray, Chelsea Voss, Alec Radford, Mark Chen, and Ilya Sutskever. 2021. Zero-shot text-to-image generation. In International conference on machine learning. Pmlr, 8821\u20138831."},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.4324\/9781315771045"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"crossref","unstructured":"Ulrich Schiefele. 1991. Interest learning and motivation. Educational Psychologist 26 3-4 (1991) 299\u2013323.","DOI":"10.1080\/00461520.1991.9653136"},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"publisher","unstructured":"Albrecht Schmidt. 2017. Augmenting Human Intellect and Amplifying Perception and Cognition. IEEE Pervasive Computing 16 1 (2017) 6\u201310. 10.1109\/MPRV.2017.8","DOI":"10.1109\/MPRV.2017.8"},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"crossref","unstructured":"Roger\u00a0N. Shepard. 1967. Recognition memory for words sentences and pictures. Journal of Verbal Learning and Verbal Behavior 6 1 (1967) 156\u2013163.","DOI":"10.1016\/S0022-5371(67)80067-7"},{"key":"e_1_3_3_2_34_2","unstructured":"Haotian Sun Yuchen Zhuang Lingkai Kong Bo Dai and Chao Zhang. 2024. Adaplanner: Adaptive planning from feedback with language models. Advances in Neural Information Processing Systems 36 (2024)."},{"key":"e_1_3_3_2_35_2","doi-asserted-by":"crossref","unstructured":"Susanne Trauzettel-Klosinski Klaus Dietz IReST\u00a0Study Group et\u00a0al. 2012. Standardized assessment of reading performance: The new international reading speed texts IReST. Investigative ophthalmology & visual science 53 9 (2012) 5452\u20135461.","DOI":"10.1167\/iovs.11-8284"},{"key":"e_1_3_3_2_36_2","doi-asserted-by":"publisher","DOI":"10.1145\/3458709.3459002"},{"key":"e_1_3_3_2_37_2","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan\u00a0N Gomez \u0141ukasz Kaiser and Illia Polosukhin. 2017. Attention is all you need. Advances in neural information processing systems 30 (2017)."},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642548"},{"key":"e_1_3_3_2_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/3640543.3645143"},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642803"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"crossref","unstructured":"Genta\u00a0Indra Winata Andrea Madotto Zhaojiang Lin Rosanne Liu Jason Yosinski and Pascale Fung. 2021. Language models are few-shot multilingual learners. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2109.07684 (2021).","DOI":"10.18653\/v1\/2021.mrl-1.1"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544793.3560382"},{"key":"e_1_3_3_2_43_2","unstructured":"Qi Yang Sergey Nikolenko Marlo Ongpin Ilia Gossoudarev Yu-Yi Chu-Farseeva and Aleksandr Farseev. 2024. SOMONITOR: Explainable Marketing Data Processing and Analysis with Large Language Models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2407.13117 (2024)."},{"key":"e_1_3_3_2_44_2","doi-asserted-by":"crossref","unstructured":"Ruibin Yuan Hanfeng Lin Yi Wang Zeyue Tian Shangda Wu Tianhao Shen Ge Zhang Yuhang Wu Cong Liu Ziya Zhou et\u00a0al. 2024. Chatmusician: Understanding and generating music intrinsically with llm. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2402.16153 (2024).","DOI":"10.18653\/v1\/2024.findings-acl.373"}],"event":{"name":"AHs 2025: The Augmented Humans International Conference","location":"Masdar City, Abu Dhabi United Arab Emirates","acronym":"AHs '25","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the Augmented Humans International Conference 2025"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3745900.3746066","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,9]],"date-time":"2025-10-09T12:02:44Z","timestamp":1760011364000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3745900.3746066"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,16]]},"references-count":43,"alternative-id":["10.1145\/3745900.3746066","10.1145\/3745900"],"URL":"https:\/\/doi.org\/10.1145\/3745900.3746066","relation":{},"subject":[],"published":{"date-parts":[[2025,3,16]]},"assertion":[{"value":"2025-10-09","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}