{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T11:09:58Z","timestamp":1730200198863,"version":"3.28.0"},"reference-count":36,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,12,10]],"date-time":"2020-12-10T00:00:00Z","timestamp":1607558400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,12,10]],"date-time":"2020-12-10T00:00:00Z","timestamp":1607558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,12,10]],"date-time":"2020-12-10T00:00:00Z","timestamp":1607558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,12,10]]},"DOI":"10.1109\/bigdata50022.2020.9377742","type":"proceedings-article","created":{"date-parts":[[2021,3,19]],"date-time":"2021-03-19T17:10:21Z","timestamp":1616173821000},"page":"5727-5729","source":"Crossref","is-referenced-by-count":1,"title":["WebLens: Towards Web-scale Data Integration, Training the Models"],"prefix":"10.1109","author":[{"given":"Rituparna","family":"Khan","sequence":"first","affiliation":[]},{"given":"Michael","family":"Gubanov","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref33","first-page":"1","article-title":"Mllib: Machine learning in apache spark","volume":"17","author":"meng","year":"0","journal-title":"Journal of Machine Learning Research"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3380597"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3389743"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/s007780100057"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3380572"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/2934664"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3389726"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/S0169-7552(98)00110-X"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.14778\/1453856.1453916"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.14778\/1453856.1453916"},{"article-title":"Keras","year":"2015","author":"chollet","key":"ref13"},{"article-title":"Keras","year":"2015","author":"chollet","key":"ref14"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/357980.358007"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3380605"},{"key":"ref17","article-title":"Hybrid: A large-scale in-memory image analytics system","author":"gubanov","year":"2017","journal-title":"CIDR"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2017.230"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/3041021.3054735"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3389779"},{"year":"0","key":"ref4","article-title":"Naive bayes"},{"key":"ref27","article-title":"T. Distributed representations of words and phrases and their compositionality","author":"mikolov","year":"2013","journal-title":"In Advances in Neural Information Processing Systems"},{"year":"0","key":"ref3","article-title":"Multi-layer perceptron, sequential model"},{"article-title":"TensorFlow: Large-scale machine learning on heterogeneous systems","year":"2015","author":"abadi","key":"ref6"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/B978-012722442-8\/50081-1"},{"year":"0","key":"ref5","article-title":"Support vector machine"},{"key":"ref8","first-page":"209","article-title":"Applying model management to classical meta data problems","author":"bernstein","year":"2003","journal-title":"CIDR"},{"key":"ref7","article-title":"Simplifying information integration: Object-based flow-of-mappings framework for integration","author":"alexe","year":"2008","journal-title":"BIRTE"},{"year":"0","key":"ref2","article-title":"Logistic regression"},{"key":"ref9","article-title":"Extracting patterns and relations from the world wide web","author":"brin","year":"1998","journal-title":"EDBT"},{"year":"0","key":"ref1","article-title":"Here is the toothbrush test google&#x2019;s ceo uses to make acquisition decisions"},{"key":"ref20","article-title":"Readfast: High-relevance search-engine for big text","author":"gubanov","year":"2013","journal-title":"ACM CIKM"},{"key":"ref22","article-title":"Large-scale semantic profile extraction","author":"gubanov","year":"2014","journal-title":"EDBT"},{"key":"ref21","article-title":"Type-aware web search","author":"gubanov","year":"2014","journal-title":"EDBT"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2005.39"},{"key":"ref23","article-title":"Metadata management engine for data integration with reverse-engineering support","author":"gubanov","year":"2008","journal-title":"ICDE"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/872781.872782"},{"key":"ref25","article-title":"Elmo: Deep contextualized word representations","author":"matthew","year":"2018","journal-title":"NAACL"}],"event":{"name":"2020 IEEE International Conference on Big Data (Big Data)","start":{"date-parts":[[2020,12,10]]},"location":"Atlanta, GA, USA","end":{"date-parts":[[2020,12,13]]}},"container-title":["2020 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9377717\/9377728\/09377742.pdf?arnumber=9377742","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T11:59:10Z","timestamp":1656331150000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9377742\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,12,10]]},"references-count":36,"URL":"https:\/\/doi.org\/10.1109\/bigdata50022.2020.9377742","relation":{},"subject":[],"published":{"date-parts":[[2020,12,10]]}}}