{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,11]],"date-time":"2025-01-11T05:32:56Z","timestamp":1736573576040,"version":"3.32.0"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,11,9]],"date-time":"2024-11-09T00:00:00Z","timestamp":1731110400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,11,9]],"date-time":"2024-11-09T00:00:00Z","timestamp":1731110400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,11,9]]},"DOI":"10.1109\/scisisis61014.2024.10759966","type":"proceedings-article","created":{"date-parts":[[2024,12,2]],"date-time":"2024-12-02T18:35:23Z","timestamp":1733164523000},"page":"1-6","source":"Crossref","is-referenced-by-count":0,"title":["Verbal Description Focusing on Physical Properties of Real-World Environments"],"prefix":"10.1109","author":[{"given":"Eri","family":"Kuroda","sequence":"first","affiliation":[{"name":"Ochanomizu University,Tokyo,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuki","family":"Taya","sequence":"additional","affiliation":[{"name":"Ochanomizu University,Tokyo,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ichiro","family":"Kobayashi","sequence":"additional","affiliation":[{"name":"Ochanomizu University,Tokyo,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-31635-3_22"},{"volume-title":"A path towards autonomous machine intelligence","author":"LeCun","key":"ref2"},{"volume-title":"Deep predictive coding networks for video prediction and unsupervised learning","year":"2016","author":"Lotter","key":"ref3"},{"key":"ref4","article-title":"Predrnn: Recurrent neural networks for predictive learning using spatiotemporal lstms","volume-title":"Advances in Neural Information Processing Systems","volume":"30","author":"Wang","year":"2017"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2022.3165153"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2023.3240857"},{"volume-title":"CLEVR: A diagnostic dataset for compositional language and elementary visual reasoning","year":"2016","author":"Johnson","key":"ref7"},{"volume-title":"CLEVRER: CoLlision events for video REpresentation and reasoning","year":"2019","author":"Yi","key":"ref8"},{"volume-title":"MONet: Unsupervised scene decomposition and representation","year":"2019","author":"Christopher","key":"ref9"},{"volume-title":"CLEVRER- Humans: Describing physical and causal events the human way","year":"2022","author":"Mao","key":"ref10"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-long.159"},{"volume-title":"Variational temporal abstraction","year":"2019","author":"Kim","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-45275-8_29"},{"volume-title":"Variational dropout and the local reparameterization trick","year":"2015","author":"Diederik","key":"ref14"},{"key":"ref15","first-page":"311","article-title":"BLEU: a method for automatic evaluation of machine translation","volume-title":"Proceedings of the 40th Annual Meeting on Association for Computational Linguistics, ACL \u201802","author":"Papineni","year":"2002"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3115\/1626355.1626389"},{"volume-title":"CIDEr: Consensus-based image description evaluation","year":"2014","author":"Vedantam","key":"ref17"},{"volume-title":"Exploring the limits of transfer learning with a unified Text-to- Text transformer","year":"2019","author":"Raffel","key":"ref18"},{"volume-title":"Attention is all you need","year":"2017","author":"Vaswani","key":"ref19"},{"key":"ref20","article-title":"Decoupled weight decay regularization","author":"Loshchilov","year":"2017","journal-title":"arXiv [cs.LG]"},{"key":"ref21","article-title":"BERTScore: Evaluating text generation with BERT","author":"Zhang","year":"2019","journal-title":"arXiv [cs.CL]"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.704"},{"key":"ref23","first-page":"74","article-title":"ROUGE: A package for automatic evaluation of summaries","volume-title":"Text Summarization Branches Out","author":"Lin","year":"2004"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.153"}],"event":{"name":"2024 Joint 13th International Conference on Soft Computing and Intelligent Systems and 25th International Symposium on Advanced Intelligent Systems (SCIS&amp;ISIS)","start":{"date-parts":[[2024,11,9]]},"location":"Himeji, Japan","end":{"date-parts":[[2024,11,12]]}},"container-title":["2024 Joint 13th International Conference on Soft Computing and Intelligent Systems and 25th International Symposium on Advanced Intelligent Systems (SCIS&amp;amp;ISIS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10759795\/10759863\/10759966.pdf?arnumber=10759966","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,10]],"date-time":"2025-01-10T19:45:37Z","timestamp":1736538337000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10759966\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,9]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/scisisis61014.2024.10759966","relation":{},"subject":[],"published":{"date-parts":[[2024,11,9]]}}}