{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,5]],"date-time":"2026-07-05T21:14:41Z","timestamp":1783286081946,"version":"3.54.6"},"publisher-location":"New York, NY, USA","reference-count":121,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,3,23]]},"DOI":"10.1145\/3742413.3789142","type":"proceedings-article","created":{"date-parts":[[2026,3,3]],"date-time":"2026-03-03T11:32:24Z","timestamp":1772537544000},"page":"1362-1386","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Canvas3D: Empowering Precise Spatial Control for Image Generation with Constraints from a 3D Virtual Canvas"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-6196-1176","authenticated-orcid":false,"given":"Yuzhao","family":"Chen","sequence":"first","affiliation":[{"name":"Elmore Family School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8256-6419","authenticated-orcid":false,"given":"Runlin","family":"Duan","sequence":"additional","affiliation":[{"name":"School of Mechanical Engineering, Purdue University, West Lafayette, IN, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-3723-5482","authenticated-orcid":false,"given":"Rahul","family":"Jain","sequence":"additional","affiliation":[{"name":"Elmore Family School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-9385-4456","authenticated-orcid":false,"given":"Yichen","family":"Hu","sequence":"additional","affiliation":[{"name":"Department of Computer Sciences, Purdue University, West Lafayette, IN, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-3408-2876","authenticated-orcid":false,"given":"Chenfei","family":"Zhu","sequence":"additional","affiliation":[{"name":"School of Mechanical Engineering, Purdue University, West Lafayette, IN, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5159-2235","authenticated-orcid":false,"given":"Jingyu","family":"Shi","sequence":"additional","affiliation":[{"name":"Elmore Family School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8639-5135","authenticated-orcid":false,"given":"Karthik","family":"Ramani","sequence":"additional","affiliation":[{"name":"School of Mechanical Engineering, Purdue University, West Lafayette, IN, USA and Elmore Family School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,3,22]]},"reference":[{"key":"e_1_3_3_2_2_2","doi-asserted-by":"crossref","unstructured":"Remi Alkemade Fons\u00a0J Verbeek and Stephan\u00a0G Lukosch. 2017. On the efficiency of a VR hand gesture-based interface for 3D object manipulations in conceptual design. International Journal of Human\u2013Computer Interaction 33 11 (2017) 882\u2013901.","DOI":"10.1080\/10447318.2017.1296074"},{"key":"e_1_3_3_2_3_2","unstructured":"Autodesk. 2025. Autodesk | 3D Design Engineering & Construction Software. https:\/\/www.autodesk.com\/ Accessed: 2025-04-09."},{"key":"e_1_3_3_2_4_2","doi-asserted-by":"publisher","DOI":"10.1145\/3680528.3687590"},{"key":"e_1_3_3_2_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3025453.3025863"},{"key":"e_1_3_3_2_6_2","doi-asserted-by":"publisher","DOI":"10.1145\/3641519.3657525"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606725"},{"key":"e_1_3_3_2_8_2","unstructured":"Wenxiao Cai Iaroslav Ponomarenko Jianhao Yuan Xiaoqi Li Wankou Yang Hao Dong and Bo Zhao. 2024. Spatialbot: Precise spatial understanding with vision language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2406.13642 (2024)."},{"key":"e_1_3_3_2_9_2","doi-asserted-by":"crossref","unstructured":"Zhe Cao Gines Hidalgo Tomas Simon Shih-En Wei and Yaser Sheikh. 2019. Openpose: Realtime multi-person 2d pose estimation using part affinity fields. IEEE transactions on pattern analysis and machine intelligence 43 1 (2019) 172\u2013186.","DOI":"10.1109\/TPAMI.2019.2929257"},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.143"},{"key":"e_1_3_3_2_11_2","unstructured":"Angel\u00a0X Chang Thomas Funkhouser Leonidas Guibas Pat Hanrahan Qixing Huang Zimo Li Silvio Savarese Manolis Savva Shuran Song Hao Su et\u00a0al. 2015. Shapenet: An information-rich 3d model repository. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1512.03012 (2015)."},{"key":"e_1_3_3_2_12_2","doi-asserted-by":"crossref","unstructured":"Hila Chefer Yuval Alaluf Yael Vinker Lior Wolf and Daniel Cohen-Or. 2023. Attend-and-excite: Attention-based semantic guidance for text-to-image diffusion models. ACM transactions on Graphics (TOG) 42 4 (2023) 1\u201310.","DOI":"10.1145\/3592116"},{"key":"e_1_3_3_2_13_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642794"},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606777"},{"key":"e_1_3_3_2_15_2","doi-asserted-by":"crossref","unstructured":"Charles\u00a0E Connor and James\u00a0J Knierim. 2017. Integration of objects and space in perception and memory. Nature neuroscience 20 11 (2017) 1493\u20131503.","DOI":"10.1038\/nn.4657"},{"key":"e_1_3_3_2_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3502141"},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"crossref","unstructured":"Jonas Degrave Michiel Hermans Joni Dambre and Francis Wyffels. 2019. A differentiable physics engine for deep learning in robotics. Frontiers in neurorobotics 13 (2019) 6.","DOI":"10.3389\/fnbot.2019.00006"},{"key":"e_1_3_3_2_18_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01263"},{"key":"e_1_3_3_2_19_2","volume-title":"Spatial cognition, spatial perception: mapping the self and space","author":"Dolins Francine\u00a0L","year":"2010","unstructured":"Francine\u00a0L Dolins and Robert\u00a0W Mitchell. 2010. Spatial cognition, spatial perception: mapping the self and space. Cambridge University Press."},{"key":"e_1_3_3_2_20_2","doi-asserted-by":"publisher","DOI":"10.1145\/3641519.3657425"},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"crossref","unstructured":"Runlin Duan Xiyun Hu Min Liu Jingyu Shi and Karthik Ramani. 2025. pARametric: Empowering In Situ Parametric Modeling in Augment Reality for Personal Fabrication. Journal of Computing and Information Science in Engineering 25 4 (2025) 041001.","DOI":"10.1115\/1.4067704"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"publisher","DOI":"10.1115\/DETC2024-146409"},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"publisher","DOI":"10.1145\/3715336.3735824"},{"key":"e_1_3_3_2_24_2","unstructured":"Runlin Duan Chenfei Zhu Yuzhao Chen Dizhi Ma Jingyu Shi Ziyi Liu and Karthik Ramani. 2025. SketchConcept: Sketching-based Concept Recomposition for Product Design using Generative AI. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2508.07141 (2025)."},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","DOI":"10.1201\/b18212"},{"key":"e_1_3_3_2_26_2","unstructured":"Abdelrahman Eldesokey and Peter Wonka. 2024. Build-a-scene: Interactive 3d layout control for diffusion-based image generation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2408.14819 (2024)."},{"key":"e_1_3_3_2_27_2","unstructured":"Inc. Exocortex\u00a0Technologies. 2013. Clara.io: Online 3D Modeling 3D Rendering Free 3D Models. https:\/\/clara.io\/ Accessed: 2025-04-07."},{"key":"e_1_3_3_2_28_2","volume-title":"The nature of landscape design","author":"Fairbrother Nan","year":"1974","unstructured":"Nan Fairbrother. 1974. The nature of landscape design. Architectural Press London."},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"crossref","unstructured":"Weixi Feng Wanrong Zhu Tsu-jui Fu Varun Jampani Arjun Akula Xuehai He Sugato Basu Xin\u00a0Eric Wang and William\u00a0Yang Wang. 2023. Layoutgpt: Compositional visual planning and generation with large language models. Advances in Neural Information Processing Systems 36 (2023) 18225\u201318250.","DOI":"10.52202\/075280-0802"},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"crossref","unstructured":"Donato Fiorella Andrea Sanna and Fabrizio Lamberti. 2010. Multi-touch user interface evaluation for 3D object manipulation on mobile devices. Journal on Multimodal User Interfaces 4 (2010) 3\u201310.","DOI":"10.1007\/s12193-009-0034-4"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"crossref","unstructured":"Gaspare Galati Gina Pelle Alain Berthoz and Giorgia Committeri. 2010. Multiple reference frames used by the human brain for spatial perception and memory. Experimental brain research 206 (2010) 109\u2013120.","DOI":"10.1007\/s00221-010-2168-8"},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"crossref","unstructured":"Ruiqi Gao Aleksander Holynski Philipp Henzler Arthur Brussee Ricardo Martin-Brualla Pratul Srinivasan Jonathan\u00a0T Barron and Ben Poole. 2024. Cat3d: Create anything in 3d with multi-view diffusion models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2405.10314 (2024).","DOI":"10.52202\/079017-2403"},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"publisher","DOI":"10.4324\/9781315740218"},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"crossref","unstructured":"Eg\u00a0Su Goh Mohd\u00a0Shahrizal Sunar and Ajune\u00a0Wanis Ismail. 2019. 3D object manipulation techniques in handheld mobile augmented reality interface: A review. IEEE Access 7 (2019) 40581\u201340601.","DOI":"10.1109\/ACCESS.2019.2906394"},{"key":"e_1_3_3_2_35_2","unstructured":"Tejas Gokhale Hamid Palangi Besmira Nushi Vibhav Vineet Eric Horvitz Ece Kamar Chitta Baral and Yezhou Yang. 2022. Benchmarking spatial relationships in text-to-image generation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2212.10015 (2022)."},{"key":"e_1_3_3_2_36_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7091-6242-2_8"},{"key":"e_1_3_3_2_37_2","doi-asserted-by":"crossref","unstructured":"Daniel Gopher Lilach Armony and Yaakov Greenshpan. 2000. Switching tasks and attention policies.Journal of Experimental Psychology: General 129 3 (2000) 308.","DOI":"10.1037\/0096-3445.129.3.308"},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"crossref","unstructured":"Daniel\u00a0J Graham and Christoph Redies. 2010. Statistical regularities in art: Relations with visual coding and perception. Vision research 50 16 (2010) 1503\u20131509.","DOI":"10.1016\/j.visres.2010.05.002"},{"key":"e_1_3_3_2_39_2","unstructured":"SG Hart. 1988. Development of NASA-TLX (Task Load Index): Results of empirical and theoretical research. Human mental workload\/Elsevier (1988)."},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3580704"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642224"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"crossref","unstructured":"Kaiyi Huang Chengqi Duan Kaiyue Sun Enze Xie Zhenguo Li and Xihui Liu. 2025. T2I-CompBench++: An Enhanced and Comprehensive Benchmark for Compositional Text-to-Image Generation. IEEE Transactions on Pattern Analysis and Machine Intelligence (2025).","DOI":"10.1109\/TPAMI.2025.3531907"},{"key":"e_1_3_3_2_43_2","doi-asserted-by":"crossref","unstructured":"Zheng Huang Qiang Liu Stephen Westland Michael\u00a0R Pointer M\u00a0Ronnier Luo and Kaida Xiao. 2018. Light dominates colour preference when correlated colour temperature differs. Lighting Research & Technology 50 7 (2018) 995\u20131012.","DOI":"10.1177\/1477153517713542"},{"key":"e_1_3_3_2_44_2","unstructured":"Adobe Inc.2025. Adobe Substance 3D Stager. https:\/\/www.adobe.com\/products\/substance3d\/apps\/stager.html Accessed: 2025-04-07."},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3714292"},{"key":"e_1_3_3_2_46_2","volume-title":"Eurographics 2013-STAR","author":"Jankowski Jacek","year":"2013","unstructured":"Jacek Jankowski and Martin Hachet. 2013. A survey of interaction techniques for interactive 3D environments. In Eurographics 2013-STAR."},{"key":"e_1_3_3_2_47_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445093"},{"key":"e_1_3_3_2_48_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01465"},{"key":"e_1_3_3_2_49_2","doi-asserted-by":"publisher","DOI":"10.5555\/2328888.2328898"},{"key":"e_1_3_3_2_50_2","doi-asserted-by":"crossref","unstructured":"Minseok Kim and Jae\u00a0Yeol Lee. 2016. Touch and hand gesture-based interactions for directly manipulating 3D virtual objects in mobile augmented reality. Multimedia Tools and Applications 75 (2016) 16529\u201316550.","DOI":"10.1007\/s11042-016-3355-9"},{"key":"e_1_3_3_2_51_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300863"},{"key":"e_1_3_3_2_52_2","doi-asserted-by":"crossref","unstructured":"James\u00a0M Leonhardt Jesse\u00a0R Catlin and Dante\u00a0M Pirouz. 2015. Is your product facing the ad\u2019s center? Facing direction affects processing fluency and ad evaluation. Journal of Advertising 44 4 (2015) 315\u2013325.","DOI":"10.1080\/00913367.2015.1048911"},{"key":"e_1_3_3_2_53_2","doi-asserted-by":"crossref","unstructured":"Mieke\u00a0HR Leyssen Sarah Linsen Jonathan Sammartino and Stephen\u00a0E Palmer. 2012. Aesthetic preference for spatial composition in multiobject pictures. i-Perception 3 1 (2012) 25\u201349.","DOI":"10.1068\/i0458aap"},{"key":"e_1_3_3_2_54_2","doi-asserted-by":"publisher","DOI":"10.1145\/3654777.3676325"},{"key":"e_1_3_3_2_55_2","unstructured":"Xirui Li Charles Herrmann Kelvin\u00a0CK Chan Yinxiao Li Deqing Sun Chao Ma and Ming-Hsuan Yang. 2024. A simple approach to unifying diffusion-based conditional generation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.11439 (2024)."},{"key":"e_1_3_3_2_56_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01765"},{"key":"e_1_3_3_2_57_2","doi-asserted-by":"publisher","DOI":"10.1145\/3672539.3686339"},{"key":"e_1_3_3_2_58_2","unstructured":"David Chuan-En Lin Hyeonsu\u00a0B Kang Nikolas Martelaro Aniket Kittur Yan-Ying Chen and Matthew\u00a0K Hong. 2025. Inkspire: Supporting Design Exploration with Generative AI through Analogical Sketching. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2501.18588 (2025)."},{"key":"e_1_3_3_2_59_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713801"},{"key":"e_1_3_3_2_60_2","unstructured":"Daochang Liu Junyu Zhang Anh-Dung Dinh Eunbyung Park Shichao Zhang and Chang Xu. 2025. Generative Physical AI in Vision: A Survey. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2501.10928 (2025)."},{"key":"e_1_3_3_2_61_2","doi-asserted-by":"publisher","DOI":"10.1145\/3563657.3596098"},{"key":"e_1_3_3_2_62_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3581442"},{"key":"e_1_3_3_2_63_2","doi-asserted-by":"crossref","unstructured":"Tiange Luo Chris Rockwell Honglak Lee and Justin Johnson. 2023. Scalable 3d captioning with pretrained models. Advances in Neural Information Processing Systems 36 (2023) 75307\u201375337.","DOI":"10.52202\/075280-3291"},{"key":"e_1_3_3_2_64_2","unstructured":"Hira Maqbool. 2023. Aesthetic choices: Defining the range of aesthetic views in interactive digital media including games and 3D virtual environments (3D VEs). (2023)."},{"key":"e_1_3_3_2_65_2","doi-asserted-by":"publisher","DOI":"10.1111\/cgf.13390"},{"key":"e_1_3_3_2_66_2","doi-asserted-by":"crossref","unstructured":"Siwei Meng Yawei Luo and Ping Liu. 2025. Grounding Creativity in Physics: A Brief Survey of Physical Priors in AIGC. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2502.07007 (2025).","DOI":"10.24963\/ijcai.2025\/1176"},{"key":"e_1_3_3_2_67_2","unstructured":"Zhenxing Mi Kuan-Chieh Wang Guocheng Qian Hanrong Ye Runtao Liu Sergey Tulyakov Kfir Aberman and Dan Xu. 2025. I Think Therefore I Diffuse: Enabling Multimodal In-Context Reasoning in Diffusion Models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2502.10458 (2025)."},{"key":"e_1_3_3_2_68_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i5.28226"},{"key":"e_1_3_3_2_69_2","doi-asserted-by":"crossref","unstructured":"Maria\u00a0Adriana Neroni Alfred Oti and Nathan Crilly. 2021. Virtual Reality design-build-test games with physics simulation: opportunities for researching design cognition. International Journal of Design Creativity and Innovation 9 3 (2021) 139\u2013173.","DOI":"10.1080\/21650349.2021.1929500"},{"key":"e_1_3_3_2_70_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642440"},{"key":"e_1_3_3_2_71_2","unstructured":"Open Robotics. 2025. Robot Operating System (ROS). https:\/\/www.ros.org\/ Accessed: 2025-04-09."},{"key":"e_1_3_3_2_72_2","unstructured":"OpenAI. 2025. OpenAI. https:\/\/openai.com\/ Accessed: 2025-04-09."},{"key":"e_1_3_3_2_73_2","unstructured":"Jonas Oppenlaender Rhema Linder and Johanna Silvennoinen. 2024. Prompting AI art: An investigation into the creative skill of prompt engineering. International journal of human\u2013computer interaction (2024) 1\u201323."},{"key":"e_1_3_3_2_74_2","doi-asserted-by":"crossref","unstructured":"Stephen\u00a0E Palmer Jonathan\u00a0S Gardner and Thomas\u00a0D Wickens. 2008. Aesthetic issues in spatial composition: Effects of position and direction on framing single objects. Spatial vision 21 3 (2008) 421\u2013450.","DOI":"10.1163\/156856808784532662"},{"key":"e_1_3_3_2_75_2","doi-asserted-by":"crossref","unstructured":"Stephen\u00a0E Palmer Karen\u00a0B Schloss and Jonathan Sammartino. 2013. Visual aesthetics and human preference. Annual review of psychology 64 1 (2013) 77\u2013107.","DOI":"10.1146\/annurev-psych-120710-100504"},{"key":"e_1_3_3_2_76_2","doi-asserted-by":"publisher","DOI":"10.1145\/3588432.3591500"},{"key":"e_1_3_3_2_77_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706599.3719802"},{"key":"e_1_3_3_2_78_2","volume-title":"Composition in art","author":"Poore Henry\u00a0Rankin","year":"1976","unstructured":"Henry\u00a0Rankin Poore. 1976. Composition in art. Courier Corporation."},{"key":"e_1_3_3_2_79_2","doi-asserted-by":"publisher","DOI":"10.1145\/3526113.3545663"},{"key":"e_1_3_3_2_80_2","doi-asserted-by":"crossref","unstructured":"Can Qin Shu Zhang Ning Yu Yihao Feng Xinyi Yang Yingbo Zhou Huan Wang Juan\u00a0Carlos Niebles Caiming Xiong Silvio Savarese et\u00a0al. 2023. Unicontrol: A unified diffusion model for controllable visual generation in the wild. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2305.11147 (2023).","DOI":"10.52202\/075280-1862"},{"key":"e_1_3_3_2_81_2","unstructured":"Aditya Ramesh Prafulla Dhariwal Alex Nichol Casey Chu and Mark Chen. 2022. Hierarchical text-conditional image generation with clip latents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2204.06125 1 2 (2022) 3."},{"key":"e_1_3_3_2_82_2","first-page":"8821","volume-title":"International conference on machine learning","author":"Ramesh Aditya","year":"2021","unstructured":"Aditya Ramesh, Mikhail Pavlov, Gabriel Goh, Scott Gray, Chelsea Voss, Alec Radford, Mark Chen, and Ilya Sutskever. 2021. Zero-shot text-to-image generation. In International conference on machine learning. Pmlr, 8821\u20138831."},{"key":"e_1_3_3_2_83_2","doi-asserted-by":"crossref","unstructured":"Nils Reimers and Iryna Gurevych. 2019. Sentence-bert: Sentence embeddings using siamese bert-networks. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1908.10084 (2019).","DOI":"10.18653\/v1\/D19-1410"},{"key":"e_1_3_3_2_84_2","doi-asserted-by":"publisher","DOI":"10.1145\/1622176.1622190"},{"key":"e_1_3_3_2_85_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"e_1_3_3_2_86_2","doi-asserted-by":"crossref","unstructured":"Jonathan Sammartino and Stephen\u00a0E Palmer. 2012. Aesthetic issues in spatial composition: Effects of vertical position and perspective on framing single objects.Journal of Experimental Psychology: Human Perception and Performance 38 4 (2012) 865.","DOI":"10.1037\/a0027736"},{"key":"e_1_3_3_2_87_2","doi-asserted-by":"crossref","unstructured":"Kevin\u00a0L Sample Henrik Hagtvedt and S\u00a0Adam Brasel. 2020. Components of visual perception in marketing contexts: A conceptual framework and review. Journal of the Academy of Marketing Science 48 (2020) 405\u2013421.","DOI":"10.1007\/s11747-019-00684-4"},{"key":"e_1_3_3_2_88_2","doi-asserted-by":"publisher","DOI":"10.1145\/3654777.3676444"},{"key":"e_1_3_3_2_89_2","doi-asserted-by":"publisher","DOI":"10.1109\/3DUI.2012.6184195"},{"key":"e_1_3_3_2_90_2","doi-asserted-by":"crossref","unstructured":"Jingyu Shi Rahul Jain Seungguen Chi Hyungjun Doh Hyunggun Chi Alexander\u00a0J Quinn and Karthik Ramani. 2025. CARING-AI: Towards Authoring Context-aware Augmented Reality INstruction through Generative Artificial Intelligence. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2501.16557 (2025).","DOI":"10.1145\/3706598.3713348"},{"key":"e_1_3_3_2_91_2","unstructured":"Jingyu Shi Rahul Jain Runlin Duan and Karthik Ramani. 2023. Understanding generative AI in art: an interview study with artists on G-AI from an HCI perspective. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2310.13149 (2023)."},{"key":"e_1_3_3_2_92_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3714087"},{"key":"e_1_3_3_2_93_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642391"},{"key":"e_1_3_3_2_94_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00844"},{"key":"e_1_3_3_2_95_2","doi-asserted-by":"publisher","DOI":"10.1145\/3680528.3687668"},{"key":"e_1_3_3_2_96_2","doi-asserted-by":"crossref","unstructured":"Dirk Sikkel Reinder Steenbergen and Sjoerd Gras. 2014. Clicking vs. dragging: Different uses of the mouse and their implications for online surveys. Public opinion quarterly 78 1 (2014) 177\u2013190.","DOI":"10.1093\/poq\/nft077"},{"key":"e_1_3_3_2_97_2","unstructured":"Fan-Yun Sun Weiyu Liu Siyi Gu Dylan Lim Goutam Bhat Federico Tombari Manling Li Nick Haber and Jiajun Wu. 2024. LayoutVLM: Differentiable Optimization of 3D Layout via Vision-Language Models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2412.02193 (2024)."},{"key":"e_1_3_3_2_98_2","unstructured":"Jiao Sun Deqing Fu Yushi Hu Su Wang Royi Rassin Da-Cheng Juan Dana Alon Charles Herrmann Sjoerd van Steenkiste Ranjay Krishna et\u00a0al. 2023. Dreamsync: Aligning text-to-image generation with image understanding feedback. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2311.17946 (2023)."},{"key":"e_1_3_3_2_99_2","doi-asserted-by":"crossref","unstructured":"Kamila Svobodova Petr Sklenicka Kristina Molnarova and Jiri Vojar. 2014. Does the composition of landscape photographs affect visual preferences? The rule of the Golden Section and the position of the horizon. Journal of Environmental Psychology 38 (2014) 143\u2013152.","DOI":"10.1016\/j.jenvp.2014.01.005"},{"key":"e_1_3_3_2_100_2","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2000.844073"},{"key":"e_1_3_3_2_101_2","unstructured":"Unity Technologies. [n. d.]. Unity Real-Time Development Platform | 3D 2D VR & AR Engine. https:\/\/unity.com\/ Accessed: 2025-04-08."},{"key":"e_1_3_3_2_102_2","doi-asserted-by":"crossref","unstructured":"Troy\u00a0AW Visser Walter\u00a0F Bischof and Vincent Di\u00a0Lollo. 1999. Attentional switching in spatial and nonspatial domains: Evidence from the attentional blink.Psychological Bulletin 125 4 (1999) 458.","DOI":"10.1037\/0033-2909.125.4.458"},{"key":"e_1_3_3_2_103_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642919"},{"key":"e_1_3_3_2_104_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642901"},{"key":"e_1_3_3_2_105_2","doi-asserted-by":"publisher","DOI":"10.1145\/3472749.3474769"},{"key":"e_1_3_3_2_106_2","doi-asserted-by":"crossref","unstructured":"Zhenwei Wang Nanxuan Zhao Gerhard\u00a0P Hancke and Rynson\u00a0WH Lau. 2023. Language-based Photo Color Adjustment for Graphic Designs.ACM Trans. Graph. 42 4 (2023) 101\u20131.","DOI":"10.1145\/3592111"},{"key":"e_1_3_3_2_107_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01825"},{"key":"e_1_3_3_2_108_2","doi-asserted-by":"publisher","DOI":"10.1145\/3311350.3347175"},{"key":"e_1_3_3_2_109_2","doi-asserted-by":"publisher","DOI":"10.1145\/2821592.2821606"},{"key":"e_1_3_3_2_110_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00608"},{"key":"e_1_3_3_2_111_2","doi-asserted-by":"crossref","unstructured":"Taoxi Yang Sarita Silveira Arusu Formuli Marco Paolini Ernst P\u00f6ppel Tilmann Sander and Yan Bao. 2019. Aesthetic experiences across cultures: Neural correlates when viewing traditional Eastern or Western landscape paintings. Frontiers in psychology 10 (2019) 798.","DOI":"10.3389\/fpsyg.2019.00798"},{"key":"e_1_3_3_2_112_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00407"},{"key":"e_1_3_3_2_113_2","doi-asserted-by":"publisher","DOI":"10.1145\/3654777.3676399"},{"key":"e_1_3_3_2_114_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00355"},{"key":"e_1_3_3_2_115_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Zhang Lvmin","year":"2025","unstructured":"Lvmin Zhang, Anyi Rao, and Maneesh Agrawala. 2025. Scaling in-the-wild training for diffusion-based illumination harmonization and editing by imposing consistent light transport. In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_2_116_2","doi-asserted-by":"crossref","unstructured":"Yuli Zhang Hyokjin Kwak Haeyoung Jeong and Marina Puzakova. 2019. Facing the \u201cright\u201d side? The effect of product facing direction. Journal of Advertising 48 2 (2019) 153\u2013166.","DOI":"10.1080\/00913367.2018.1503576"},{"key":"e_1_3_3_2_117_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2012.6467469"},{"key":"e_1_3_3_2_118_2","unstructured":"Zibo Zhao Zeqiang Lai Qingxiang Lin Yunfei Zhao Haolin Liu Shuhui Yang Yifei Feng Mingxin Yang Sheng Zhang Xianghui Yang et\u00a0al. 2025. Hunyuan3d 2.0: Scaling diffusion models for high resolution textured 3d assets generation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2501.12202 (2025)."},{"key":"e_1_3_3_2_119_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02154"},{"key":"e_1_3_3_2_120_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00742"},{"key":"e_1_3_3_2_121_2","doi-asserted-by":"publisher","DOI":"10.1145\/3746059.3747676"},{"key":"e_1_3_3_2_122_2","doi-asserted-by":"publisher","DOI":"10.1145\/3526113.3545668"}],"event":{"name":"IUI '26: 31st International Conference on Intelligent User Interfaces","location":"Paphos Cyprus","acronym":"IUI '26","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction","SIGAI ACM Special Interest Group on Artificial Intelligence"]},"container-title":["Proceedings of the 31st International Conference on Intelligent User Interfaces"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3742413.3789142","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,7,5]],"date-time":"2026-07-05T20:26:50Z","timestamp":1783283210000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3742413.3789142"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,22]]},"references-count":121,"alternative-id":["10.1145\/3742413.3789142","10.1145\/3742413"],"URL":"https:\/\/doi.org\/10.1145\/3742413.3789142","relation":{},"subject":[],"published":{"date-parts":[[2026,3,22]]},"assertion":[{"value":"2026-03-22","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}