{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T05:02:51Z","timestamp":1750309371813,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":53,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,8,20]],"date-time":"2024-08-20T00:00:00Z","timestamp":1724112000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,8,20]]},"DOI":"10.1145\/3685650.3685665","type":"proceedings-article","created":{"date-parts":[[2024,9,18]],"date-time":"2024-09-18T10:19:28Z","timestamp":1726654768000},"page":"1-9","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["CatalogBank: A Structured and Interoperable Catalog Dataset with a Semi-Automatic Annotation Tool (DocumentLabeler) for Engineering System Design"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0626-2664","authenticated-orcid":false,"given":"Hasan Sinan","family":"Bank","sequence":"first","affiliation":[{"name":"Colorado State University, Fort Collins, Colorado, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4995-7375","authenticated-orcid":false,"given":"Daniel R.","family":"Herber","sequence":"additional","affiliation":[{"name":"Colorado State University, Fort Collins, Colorado, USA"}]}],"member":"320","published-online":{"date-parts":[[2024,9,18]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"CatalogBank: A Structural and Interoperable Catalog Database for Engineering System Design. https:\/\/github.com\/bankh\/CatalogBank. [Online","author":"H.S.","year":"2024","unstructured":"Bank, H.S. 2024. CatalogBank: A Structural and Interoperable Catalog Database for Engineering System Design. https:\/\/github.com\/bankh\/CatalogBank. [Online; accessed 17-April-2024]."},{"key":"e_1_3_2_1_2_1","volume-title":"DocumentLabeler: A Tool for Semi-Automated Labeling of Document Data. https:\/\/github.com\/bankh\/DocumentLabeler. [Online","author":"H.S.","year":"2024","unstructured":"Bank, H.S. 2024. DocumentLabeler: A Tool for Semi-Automated Labeling of Document Data. https:\/\/github.com\/bankh\/DocumentLabeler. [Online; accessed 17-April-2024]."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1115\/DETC2006-99518"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1115\/1.4029065"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1115\/DETC2016-59551"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.18260\/1-2--42724"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Fabrizio Dell'Acqua Edward McFowland Ethan R Mollick Hila Lifshitz-Assaf Katherine Kellogg Saran Rajendran Lisa Krayer Fran\u00e7ois Candelon and Karim R Lakhani. 2023. Navigating the jagged technological frontier: Field experimental evidence of the effects of AI on knowledge worker productivity and quality. Harvard Business School Technology & Operations Mgt. Unit Working Paper 24-013 (2023).","DOI":"10.2139\/ssrn.4573321"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/1147197.1147210"},{"key":"e_1_3_2_1_9_1","volume-title":"Gpts are gpts: An early look at the labor market impact potential of large language models. arXiv preprint arXiv:2303.10130","author":"Eloundou Tyna","year":"2023","unstructured":"Tyna Eloundou, Sam Manning, Pamela Mishkin, and Daniel Rock. 2023. Gpts are gpts: An early look at the labor market impact potential of large language models. arXiv preprint arXiv:2303.10130 (2023)."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3469096.3474933"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/2361354.2361385"},{"key":"e_1_3_2_1_12_1","volume-title":"Design prototypes: a knowledge representation schema for design. AI magazine 11, 4","author":"Gero John S","year":"1990","unstructured":"John S Gero. 1990. Design prototypes: a knowledge representation schema for design. AI magazine 11, 4 (1990), 26--26."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2019.00049"},{"key":"e_1_3_2_1_14_1","volume-title":"Thomas M\u00fcller, Francesco Piccinno, and Julian Martin Eisenschlos.","author":"Herzig Jonathan","year":"2020","unstructured":"Jonathan Herzig, Pawe\u0142 Krzysztof Nowak, Thomas M\u00fcller, Francesco Piccinno, and Julian Martin Eisenschlos. 2020. TaPas: Weakly supervised table parsing via pre-training. arXiv preprint arXiv:2004.02349 (2020)."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2019.00244"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDARW.2019.10029"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19815-1_29"},{"key":"e_1_3_2_1_18_1","volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","author":"Kingma Diederik P","year":"2014","unstructured":"Diederik P Kingma and Jimmy Ba. 2014. Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00983"},{"key":"e_1_3_2_1_20_1","volume-title":"Imagenet classification with deep convolutional neural networks. Advances in neural information processing systems 25","author":"Krizhevsky Alex","year":"2012","unstructured":"Alex Krizhevsky, Ilya Sutskever, and Geoffrey E Hinton. 2012. Imagenet classification with deep convolutional neural networks. Advances in neural information processing systems 25 (2012)."},{"key":"e_1_3_2_1_21_1","volume-title":"Proceedings of the Twelfth Language Resources and Evaluation Conference. 1918--1925","author":"Li Minghao","year":"2020","unstructured":"Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. 2020. Tablebank: Table benchmark for image-based table detection and recognition. In Proceedings of the Twelfth Language Resources and Evaluation Conference. 1918--1925."},{"key":"e_1_3_2_1_22_1","volume-title":"DocBank: A benchmark dataset for document layout analysis. arXiv preprint arXiv:2006.01038","author":"Li Minghao","year":"2020","unstructured":"Minghao Li, Yiheng Xu, Lei Cui, Shaohan Huang, Furu Wei, Zhoujun Li, and Ming Zhou. 2020. DocBank: A benchmark dataset for document layout analysis. arXiv preprint arXiv:2006.01038 (2020)."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3573128.3604903"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3469096.3470833"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1093\/ijl\/3.4.235"},{"key":"e_1_3_2_1_26_1","volume-title":"doccano: Text annotation tool for human. Software available from https:\/\/github. com\/doccano\/doccano","author":"Nakayama Hiroki","year":"2018","unstructured":"Hiroki Nakayama, Takahiro Kubo, Junya Kamura, Yasufumi Taniguchi, and Xu Liang. 2018. doccano: Text annotation tool for human. Software available from https:\/\/github. com\/doccano\/doccano (2018), 34."},{"key":"e_1_3_2_1_27_1","volume-title":"International conference on machine learning. PMLR, 7220--7229","author":"Nash Charlie","year":"2020","unstructured":"Charlie Nash, Yaroslav Ganin, SM Ali Eslami, and Peter Battaglia. 2020. Polygen: An autoregressive generative model of 3d meshes. In International conference on machine learning. PMLR, 7220--7229."},{"key":"e_1_3_2_1_28_1","volume-title":"Md Ferdous Alam, and Faez Ahmed","author":"Picard Cyril","year":"2023","unstructured":"Cyril Picard, Kristen M Edwards, Anna C Doris, Brandon Man, Giorgio Giannone, Md Ferdous Alam, and Faez Ahmed. 2023. From Concept to Manufacturing: Evaluating Vision-Language Models for Engineering Design. arXiv preprint arXiv:2311.12668 (2023)."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2019.00031"},{"key":"e_1_3_2_1_30_1","unstructured":"Alec Radford Jeffrey Wu Rewon Child David Luan Dario Amodei Ilya Sutskever et al. 2019. Language models are unsupervised multitask learners. OpenAI blog 1 8 (2019) 9."},{"key":"e_1_3_2_1_31_1","first-page":"021404","article-title":"Design strategy network: a deep hierarchical framework to represent generative design strategies in complex action spaces","volume":"144","author":"Raina Ayush","year":"2022","unstructured":"Ayush Raina, Jonathan Cagan, and Christopher McComb. 2022. Design strategy network: a deep hierarchical framework to represent generative design strategies in complex action spaces. Journal of Mechanical Design 144, 2 (2022), 021404.","journal-title":"Journal of Mechanical Design"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1115\/1.4053859"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-007-0090-8"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.compind.2022.103791"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2019.112995"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2017.192"},{"key":"e_1_3_2_1_37_1","volume-title":"Hidden technical debt in machine learning systems. Advances in neural information processing systems 28","author":"Sculley David","year":"2015","unstructured":"David Sculley, Gary Holt, Daniel Golovin, Eugene Davydov, Todd Phillips, Dietmar Ebner, Vinay Chaudhary, Michael Young, Jean-Francois Crespo, and Dan Dennison. 2015. Hidden technical debt in machine learning systems. Advances in neural information processing systems 28 (2015)."},{"volume-title":"Consciousness and language","author":"Searle John R","key":"e_1_3_2_1_38_1","unstructured":"John R Searle. 2002. Consciousness and language. Cambridge University Press."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1115\/1.4037649"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01855"},{"key":"e_1_3_2_1_41_1","volume-title":"Conceptnet at semeval-2017 task 2: Extending word embeddings with multilingual relational knowledge. arXiv preprint arXiv:1704.03560","author":"Speer Robyn","year":"2017","unstructured":"Robyn Speer and Joanna Lowry-Duda. 2017. Conceptnet at semeval-2017 task 2: Extending word embeddings with multilingual relational knowledge. arXiv preprint arXiv:1704.03560 (2017)."},{"volume-title":"The NIST design repository project","author":"Szykman Simon","key":"e_1_3_2_1_42_1","unstructured":"Simon Szykman, Ram D Sriram, Christophe Bochenek, and Janusz Racz. 1999. The NIST design repository project. Springer."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/2494266.2494323"},{"key":"e_1_3_2_1_44_1","unstructured":"Tzutalin. 2015. LabelImg. https:\/\/github.com\/tzutalin\/labelImg. Retrieved from Internet on 2023-01-14."},{"key":"e_1_3_2_1_45_1","volume-title":"Attention is all you need. Advances in neural information processing systems 30","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141ukasz Kaiser, and Illia Polosukhin. 2017. Attention is all you need. Advances in neural information processing systems 30 (2017)."},{"key":"e_1_3_2_1_46_1","volume-title":"The engineering design revolution: the people, companies and computer systems that changed forever the practice of engineering","author":"Weisberg David E","year":"2008","unstructured":"David E Weisberg. 2008. The engineering design revolution: the people, companies and computer systems that changed forever the practice of engineering. Cyon Research Corporation (2008), 1--26."},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1115\/DETC2020-22256"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/3450626.3459818"},{"key":"e_1_3_2_1_49_1","first-page":"1","article-title":"Tractatus logico-philosophicus by Ludwig Wittgenstein","volume":"59","author":"Wittgenstein Ludwig","year":"1922","unstructured":"Ludwig Wittgenstein. 1922. Tractatus logico-philosophicus by Ludwig Wittgenstein. J. Hist. Ideas 59 (1922), 1--28.","journal-title":"J. Hist. Ideas"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403172"},{"key":"e_1_3_2_1_51_1","volume-title":"Layoutxlm: Multimodal pre-training for multilingual visually-rich document understanding. arXiv preprint arXiv:2104.08836","author":"Xu Yiheng","year":"2021","unstructured":"Yiheng Xu, Tengchao Lv, Lei Cui, Guoxin Wang, Yijuan Lu, Dinei Florencio, Cha Zhang, and Furu Wei. 2021. Layoutxlm: Multimodal pre-training for multilingual visually-rich document understanding. arXiv preprint arXiv:2104.08836 (2021)."},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR48806.2021.9412927"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2019.00166"}],"event":{"name":"DocEng '24: ACM Symposium on Document Engineering 2024","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"],"location":"San Jose CA USA","acronym":"DocEng '24"},"container-title":["Proceedings of the ACM Symposium on Document Engineering 2024"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3685650.3685665","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3685650.3685665","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:06:18Z","timestamp":1750291578000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3685650.3685665"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,20]]},"references-count":53,"alternative-id":["10.1145\/3685650.3685665","10.1145\/3685650"],"URL":"https:\/\/doi.org\/10.1145\/3685650.3685665","relation":{},"subject":[],"published":{"date-parts":[[2024,8,20]]},"assertion":[{"value":"2024-09-18","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}