{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,10]],"date-time":"2025-12-10T09:08:40Z","timestamp":1765357720994,"version":"3.40.3"},"publisher-location":"Cham","reference-count":74,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031732416"},{"type":"electronic","value":"9783031732423"}],"license":[{"start":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T00:00:00Z","timestamp":1730160000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T00:00:00Z","timestamp":1730160000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-73242-3_4","type":"book-chapter","created":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T09:15:43Z","timestamp":1730106943000},"page":"56-74","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["WebRPG: Automatic Web Rendering Parameters Generation for\u00a0Visual Presentation"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4210-070X","authenticated-orcid":false,"given":"Zirui","family":"Shao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-3206-5347","authenticated-orcid":false,"given":"Feiyu","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1770-005X","authenticated-orcid":false,"given":"Hangdi","family":"Xing","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-1510-6455","authenticated-orcid":false,"given":"Zepeng","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-8608-5628","authenticated-orcid":false,"given":"Zhi","family":"Yu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1097-2044","authenticated-orcid":false,"given":"Jiajun","family":"Bu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-3822-2616","authenticated-orcid":false,"given":"Qi","family":"Zheng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6564-4796","authenticated-orcid":false,"given":"Cong","family":"Yao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,10,29]]},"reference":[{"key":"4_CR1","unstructured":"Alemerien, K., Magel, K.: GUIEvaluator: a metric-tool for evaluating the complexity of graphical user interfaces. In: SEKE, pp. 13\u201318 (2014)"},{"key":"4_CR2","doi-asserted-by":"crossref","unstructured":"Azadi, S., Fisher, M., Kim, V.G., Wang, Z., Shechtman, E., Darrell, T.: Multi-content GAN for few-shot font style transfer. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7564\u20137573 (2018)","DOI":"10.1109\/CVPR.2018.00789"},{"key":"4_CR3","unstructured":"Brown, T., et al.: Language models are few-shot learners. In: Advances in Neural Information Processing Systems, vol. 33, pp. 1877\u20131901 (2020)"},{"key":"4_CR4","doi-asserted-by":"crossref","unstructured":"Chang, H., Zhang, H., Jiang, L., Liu, C., Freeman, W.T.: MaskGIT: masked generative image transformer. In: 2022 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 11305\u201311315 (2022)","DOI":"10.1109\/CVPR52688.2022.01103"},{"key":"4_CR5","doi-asserted-by":"crossref","unstructured":"Chen, L., et al.: WebSRC: a dataset for web-based structural reading comprehension. In: Conference on Empirical Methods in Natural Language Processing (2021)","DOI":"10.18653\/v1\/2021.emnlp-main.343"},{"key":"4_CR6","unstructured":"Chen, N., Zhang, Y., Zen, H., Weiss, R.J., Norouzi, M., Chan, W.: WaveGrad: estimating gradients for waveform generation. In: International Conference on Learning Representations (2021)"},{"key":"4_CR7","doi-asserted-by":"crossref","unstructured":"Chen, N., et al.: WaveGrad 2: iterative refinement for text-to-speech synthesis. arXiv preprint arXiv:2106.09660 (2021)","DOI":"10.21437\/Interspeech.2021-1897"},{"key":"4_CR8","unstructured":"Cheng, C.Y., Huang, F., Li, G., Li, Y.: PLay: parametrically conditioned layout generation using latent diffusion. In: Proceedings of the 40th International Conference on Machine Learning, ICML 2023. JMLR.org (2023)"},{"issue":"1\u20132","key":"4_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.ijhcs.2009.08.005","volume":"68","author":"D Cyr","year":"2010","unstructured":"Cyr, D., Head, M., Larios, H.: Colour appeal in website design within and across cultures: a multi-method evaluation. Int. J. Hum Comput Stud. 68(1\u20132), 1\u201321 (2010)","journal-title":"Int. J. Hum Comput Stud."},{"key":"4_CR10","unstructured":"Deng, X., Shiralkar, P., Lockard, C., Huang, B., Sun, H.: DOM-LM: learning generalizable representations for HTML documents. arXiv preprint arXiv:2201.10608 (2022)"},{"key":"4_CR11","unstructured":"Dhariwal, P., Nichol, A.: Diffusion models beat GANs on image synthesis. In: Advances in Neural Information Processing Systems, vol. 34, pp. 8780\u20138794 (2021)"},{"key":"4_CR12","unstructured":"Dong, Z., Tang, T., Li, L., Zhao, W.X.: A survey on long text modeling with transformers. arXiv preprint arXiv:2302.14502 (2023)"},{"key":"4_CR13","unstructured":"Du, Y., et al.: Context perception parallel decoder for scene text recognition. arXiv preprint arXiv:2307.12270 (2023)"},{"issue":"2","key":"4_CR14","doi-asserted-by":"publisher","first-page":"168","DOI":"10.1108\/13287260910955129","volume":"11","author":"C Flavian","year":"2009","unstructured":"Flavian, C., Gurrea, R., Orus, C.: Web design: a key factor for the website success. J. Syst. Inf. Technol. 11(2), 168\u2013184 (2009)","journal-title":"J. Syst. Inf. Technol."},{"key":"4_CR15","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"720","DOI":"10.1007\/978-3-540-73354-6_79","volume-title":"Human Interface and the Management of Information. Interacting in Information Environments","author":"F Fu","year":"2007","unstructured":"Fu, F., Chiu, S.-Y., Su, C.H.: Measuring the screen complexity of web pages. In: Smith, M.J., Salvendy, G. (eds.) Human Interface 2007, Part II. LNCS, vol. 4558, pp. 720\u2013729. Springer, Heidelberg (2007). https:\/\/doi.org\/10.1007\/978-3-540-73354-6_79"},{"key":"4_CR16","first-page":"58","volume-title":"Cascading Style Sheets","year":"2008","unstructured":"Furht, B. (ed.): Cascading Style Sheets, p. 58. Springer, Boston (2008)"},{"key":"4_CR17","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1016\/j.cad.2016.03.001","volume":"77","author":"Z Gu","year":"2016","unstructured":"Gu, Z., Lou, J.: Data driven webpage color design. Comput. Aided Des. 77, 46\u201359 (2016)","journal-title":"Comput. Aided Des."},{"key":"4_CR18","unstructured":"Guo, D., et al.: DeepSeek-Coder: when the large language model meets programming\u2013the rise of code intelligence. arXiv preprint arXiv:2401.14196 (2024)"},{"key":"4_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1007\/978-3-030-58574-7_13","volume-title":"Computer Vision \u2013 ECCV 2020","author":"R Herzig","year":"2020","unstructured":"Herzig, R., Bar, A., Xu, H., Chechik, G., Darrell, T., Globerson, A.: Learning canonical representations for scene graph to image generation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12371, pp. 210\u2013227. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58574-7_13"},{"key":"4_CR20","unstructured":"Heusel, M., Ramsauer, H., Unterthiner, T., Nessler, B., Hochreiter, S.: GANs trained by a two time-scale update rule converge to a local Nash equilibrium. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"4_CR21","unstructured":"Ho, J., Jain, A., Abbeel, P.: Denoising diffusion probabilistic models. In: Advances in Neural Information Processing Systems, vol. 33, pp. 6840\u20136851 (2020)"},{"key":"4_CR22","unstructured":"Hotti, A., Risuleo, R.S., Magureanu, S., Moradi, A., Lagergren, J.: The klarna product page dataset: a realistic benchmark for web representation learning. arXiv preprint arXiv:2111.02168 (2021)"},{"key":"4_CR23","doi-asserted-by":"crossref","unstructured":"Hui, M., Zhang, Z., Zhang, X., Xie, W., Wang, Y., Lu, Y.: Unifying layout generation with a decoupled diffusion model. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1942\u20131951 (2023)","DOI":"10.1109\/CVPR52729.2023.00193"},{"key":"4_CR24","doi-asserted-by":"crossref","unstructured":"Inoue, N., Kikuchi, K., Simo-Serra, E., Otani, M., Yamaguchi, K.: LayoutDM: discrete diffusion model for controllable layout generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10167\u201310176 (2023)","DOI":"10.1109\/CVPR52729.2023.00980"},{"key":"4_CR25","doi-asserted-by":"crossref","unstructured":"Jyothi, A.A., Durand, T., He, J., Sigal, L., Mori, G.: LayoutVAE: stochastic scene layout generation from a label set. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9895\u20139904 (2019)","DOI":"10.1109\/ICCV.2019.00999"},{"key":"4_CR26","doi-asserted-by":"publisher","DOI":"10.1016\/j.cola.2023.101202","volume":"75","author":"T Kaluarachchi","year":"2023","unstructured":"Kaluarachchi, T., Wickramasinghe, M.: A systematic literature review on automatic website generation. J. Comput. Lang. 75, 101202 (2023)","journal-title":"J. Comput. Lang."},{"key":"4_CR27","doi-asserted-by":"crossref","unstructured":"Kikuchi, K., Inoue, N., Otani, M., Simo-Serra, E., Yamaguchi, K.: Generative colorization of structured mobile web pages. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 3650\u20133659 (2023)","DOI":"10.1109\/WACV56688.2023.00364"},{"key":"4_CR28","doi-asserted-by":"crossref","unstructured":"Kikuchi, K., Otani, M., Yamaguchi, K., Simo-Serra, E.: Modeling visual containment for web page layout optimization. In: Computer Graphics Forum, vol.\u00a040, pp. 33\u201344. Wiley Online Library (2021)","DOI":"10.1111\/cgf.14399"},{"key":"4_CR29","doi-asserted-by":"crossref","unstructured":"Kikuchi, K., Simo-Serra, E., Otani, M., Yamaguchi, K.: Constrained graphic layout generation via latent optimization. In: Proceedings of the 29th ACM International Conference on Multimedia, pp. 88\u201396 (2021)","DOI":"10.1145\/3474085.3475497"},{"key":"4_CR30","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational bayes. arXiv preprint arXiv:1312.6114 (2013)"},{"key":"4_CR31","doi-asserted-by":"crossref","unstructured":"Koffka, K.: Principles of Gestalt Psychology (1955)","DOI":"10.1515\/juru.1955.1955.9.322"},{"key":"4_CR32","unstructured":"Kong, Z., Ping, W., Huang, J., Zhao, K., Catanzaro, B.: DiffWave: a versatile diffusion model for audio synthesis. arXiv preprint arXiv:2009.09761 (2020)"},{"key":"4_CR33","unstructured":"Koo, H.: A survey on generative diffusion models for structured data. arXiv preprint arXiv:2306.04139 (2023)"},{"key":"4_CR34","unstructured":"Kumar, V., et al.: SWDE: a sub-word and document embedding based engine for clickbait detection. arXiv preprint arXiv:1808.00957 (2018)"},{"key":"4_CR35","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1007\/978-3-030-58580-8_29","volume-title":"Computer Vision \u2013 ECCV 2020","author":"H-Y Lee","year":"2020","unstructured":"Lee, H.-Y., et al.: Neural design network: graphic layout generation with constraints. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020, Part III. LNCS, vol. 12348, pp. 491\u2013506. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58580-8_29"},{"key":"4_CR36","doi-asserted-by":"crossref","unstructured":"Lewis, M., et al.: BART: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. In: Annual Meeting of the Association for Computational Linguistics (2019)","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"4_CR37","doi-asserted-by":"publisher","first-page":"3416","DOI":"10.1109\/TMM.2021.3097900","volume":"24","author":"C Li","year":"2022","unstructured":"Li, C., Zhang, P., Wang, C.: Harmonious textual layout generation over natural images via deep aesthetics learning. IEEE Trans. Multimedia 24, 3416\u20133428 (2022)","journal-title":"IEEE Trans. Multimedia"},{"key":"4_CR38","doi-asserted-by":"crossref","unstructured":"Li, G., et al.: Learning to denoise raw mobile UI layouts for improving datasets at scale, pp. 1\u201313 (2022)","DOI":"10.1145\/3491102.3502042"},{"key":"4_CR39","unstructured":"Li, J., Li, G., Li, Y., Jin, Z.: Enabling programming thinking in large language models toward code generation. arXiv preprint arXiv:2305.06599 (2023)"},{"issue":"10","key":"4_CR40","doi-asserted-by":"publisher","first-page":"4039","DOI":"10.1109\/TVCG.2020.2999335","volume":"27","author":"J Li","year":"2020","unstructured":"Li, J., Yang, J., Zhang, J., Liu, C., Wang, C., Xu, T.: Attribute-conditioned layout GAN for automatic graphic design. IEEE Trans. Vis. Comput. Graph. 27(10), 4039\u20134048 (2020)","journal-title":"IEEE Trans. Vis. Comput. Graph."},{"key":"4_CR41","doi-asserted-by":"crossref","unstructured":"Li, J., Xu, Y., Cui, L., Wei, F.: MarkupLM: pre-training of text and markup language for visually rich document understanding. In: Annual Meeting of the Association for Computational Linguistics (2021)","DOI":"10.18653\/v1\/2022.acl-long.420"},{"key":"4_CR42","unstructured":"Li, X., Thickstun, J., Gulrajani, I., Liang, P.S., Hashimoto, T.B.: Diffusion-LM improves controllable text generation. In: Advances in Neural Information Processing Systems, vol. 35, pp. 4328\u20134343 (2022)"},{"key":"4_CR43","doi-asserted-by":"crossref","unstructured":"Liu, T.F., et al.: Learning design semantics for mobile apps. In: UIST, pp. 569\u2013579 (2018)","DOI":"10.1145\/3242587.3242650"},{"key":"4_CR44","unstructured":"Loshchilov, I., Hutter, F.: Decoupled weight decay regularization. In: International Conference on Learning Representations (2017)"},{"key":"4_CR45","unstructured":"Lozhkov, A., et al.: StarCoder 2 and the stack v2: the next generation. arXiv preprint arXiv:2402.19173 (2024)"},{"key":"4_CR46","unstructured":"Network, M.D.: Computed value - CSS: Cascading style sheets (2023)"},{"key":"4_CR47","unstructured":"Nichol, A.Q., Dhariwal, P.: Improved denoising diffusion probabilistic models. In: International Conference on Machine Learning, pp. 8162\u20138171. PMLR (2021)"},{"key":"4_CR48","doi-asserted-by":"crossref","unstructured":"O\u2019Donovan, P., Agarwala, A., Hertzmann, A.: DesignScape: design with interactive layout suggestions. In: Proceedings of the 33rd Annual ACM Conference on Human Factors in Computing Systems, pp. 1221\u20131224 (2015)","DOI":"10.1145\/2702123.2702149"},{"key":"4_CR49","unstructured":"van\u00a0den Oord, A., Vinyals, O., Kavukcuoglu, K.: Neural discrete representation learning. In: Guyon, I., et al. (eds.) Advances in Neural Information Processing Systems, vol.\u00a030. Curran Associates, Inc. (2017)"},{"key":"4_CR50","unstructured":"OpenAI: GPT-4 technical report (2023)"},{"key":"4_CR51","unstructured":"Ouyang, L., et al.: Training language models to follow instructions with human feedback. In: Advances in Neural Information Processing Systems, vol. 35, pp. 27730\u201327744 (2022)"},{"issue":"8","key":"4_CR52","doi-asserted-by":"publisher","first-page":"1200","DOI":"10.1109\/TVCG.2014.48","volume":"20","author":"P O\u2019Donovan","year":"2014","unstructured":"O\u2019Donovan, P., Agarwala, A., Hertzmann, A.: Learning layouts for single-pagegraphic designs. IEEE Trans. Vis. Comput. Graph. 20(8), 1200\u20131213 (2014)","journal-title":"IEEE Trans. Vis. Comput. Graph."},{"key":"4_CR53","doi-asserted-by":"crossref","unstructured":"Qiu, Q., Otani, M., Iwazaki, Y.: An intelligent color recommendation tool for landing page design. In: 27th International Conference on Intelligent User Interfaces, pp. 26\u201329 (2022)","DOI":"10.1145\/3490100.3516450"},{"key":"4_CR54","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., Chu, C., Chen, M.: Hierarchical text-conditional image generation with CLIP latents 1(2), 3. arXiv preprint arXiv:2204.06125 (2022)"},{"key":"4_CR55","unstructured":"Razavi, A., van\u00a0den Oord, A., Vinyals, O.: Generating diverse high-fidelity images with VQ-VAE-2. In: Neural Information Processing Systems (2019)"},{"key":"4_CR56","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"4_CR57","unstructured":"Roziere, B., et al.: Code Llama: open foundation models for code. arXiv preprint arXiv:2308.12950 (2023)"},{"issue":"4","key":"4_CR58","first-page":"4713","volume":"45","author":"C Saharia","year":"2022","unstructured":"Saharia, C., Ho, J., Chan, W., Salimans, T., Fleet, D.J., Norouzi, M.: Image super-resolution via iterative refinement. IEEE Trans. Pattern Anal. Mach. Intell. 45(4), 4713\u20134726 (2022)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"4_CR59","doi-asserted-by":"crossref","unstructured":"Shao, Z., et al.: GEM: gestalt enhanced markup language model for web understanding via render tree. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 6132\u20136145 (2023)","DOI":"10.18653\/v1\/2023.emnlp-main.375"},{"key":"4_CR60","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1515\/nor-2017-0201","volume":"28","author":"L Thorlacius","year":"2007","unstructured":"Thorlacius, L.: The role of aesthetics in web design. Nordicom Rev. 28, 63\u201376 (2007)","journal-title":"Nordicom Rev."},{"key":"4_CR61","unstructured":"Touvron, H., et al.: Llama 2: open foundation and fine-tuned chat models. arXiv preprint arXiv:2307.09288 (2023)"},{"key":"4_CR62","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"4_CR63","first-page":"4328400","volume":"2022","author":"P Wang","year":"2022","unstructured":"Wang, P.: The influence of artificial intelligence on visual elements of web page design under machine vision. Comput. Intell. Neurosci. 2022, 4328400 (2022)","journal-title":"Comput. Intell. Neurosci."},{"key":"4_CR64","doi-asserted-by":"crossref","unstructured":"Wertheimer, M.: Gestalt Theory (1938)","DOI":"10.1037\/11496-001"},{"key":"4_CR65","unstructured":"Williams, R.: The Non-Designer\u2019s Design Book: Design and Typographic Principles for the Visual Novice. Pearson Education (2015)"},{"key":"4_CR66","doi-asserted-by":"crossref","unstructured":"Xiang, P., Yang, X., Shi, Y.: Web page segmentation based on gestalt theory. In: 2007 IEEE International Conference on Multimedia and Expo, pp. 2253\u20132256 (2007)","DOI":"10.1109\/ICME.2007.4285135"},{"key":"4_CR67","doi-asserted-by":"publisher","first-page":"11407","DOI":"10.1109\/TPAMI.2023.3277122","volume":"45","author":"Y Xiao","year":"2022","unstructured":"Xiao, Y., et al.: A survey on non-autoregressive generation for neural machine translation and beyond. IEEE Trans. Pattern Anal. Mach. Intell. 45, 11407\u201311427 (2022)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"4_CR68","doi-asserted-by":"crossref","unstructured":"Xie, C., Huang, W., Liang, J., Huang, C., Xiao, Y.: WebKE: knowledge extraction from semi-structured web with pre-trained markup language model. In: Proceedings of the 30th ACM International Conference on Information & Knowledge Management (2021)","DOI":"10.1145\/3459637.3482491"},{"key":"4_CR69","unstructured":"Yang, Z., et al.: The dawn of LMMs: preliminary explorations with GPT-4V (ision) 9. arXiv preprint arXiv:2309.17421 (2023)"},{"key":"4_CR70","doi-asserted-by":"crossref","unstructured":"Zhao, N., Cao, Y., Lau, R.W.: Modeling fonts in context: font prediction on web designs. In: Computer Graphics Forum, vol.\u00a037, pp. 385\u2013395. Wiley Online Library (2018)","DOI":"10.1111\/cgf.13576"},{"key":"4_CR71","doi-asserted-by":"crossref","unstructured":"Zhao, Z., Chen, L., Cao, R., Xu, H., Chen, X., Yu, K.: TIE: topological information enhanced structural reading comprehension on web pages. In: Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 1808\u20131821 (2022)","DOI":"10.18653\/v1\/2022.naacl-main.132"},{"issue":"4","key":"4_CR72","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3306346.3322971","volume":"38","author":"X Zheng","year":"2019","unstructured":"Zheng, X., Qiao, X., Cao, Y., Lau, R.W.: Content-aware generative modeling of graphic design layouts. ACM Trans. Graph. (TOG) 38(4), 1\u201315 (2019)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"4_CR73","doi-asserted-by":"crossref","unstructured":"Zhou, M., Xu, C., Ma, Y., Ge, T., Jiang, Y., Xu, W.: Composition-aware graphic layout GAN for visual-textual presentation designs. In: Raedt, L.D. (ed.) Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence, IJCAI 2022, Vienna, Austria, 23\u201329 July 2022, pp. 4995\u20135001. ijcai.org (2022)","DOI":"10.24963\/ijcai.2022\/692"},{"key":"4_CR74","unstructured":"Zhu, Y., Wu, Y., Olszewski, K., Ren, J., Tulyakov, S., Yan, Y.: Discrete contrastive diffusion for cross-modal and conditional generation. arXiv preprint arXiv:2206.07771 (2022)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-73242-3_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T09:26:35Z","timestamp":1730107595000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-73242-3_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,29]]},"ISBN":["9783031732416","9783031732423"],"references-count":74,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-73242-3_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,10,29]]},"assertion":[{"value":"29 October 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}