{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T11:06:15Z","timestamp":1730199975064,"version":"3.28.0"},"reference-count":44,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1109\/bigdata.2017.8258223","type":"proceedings-article","created":{"date-parts":[[2018,1,15]],"date-time":"2018-01-15T17:47:28Z","timestamp":1516038448000},"page":"2628-2636","source":"Crossref","is-referenced-by-count":3,"title":["Improving data quality through high precision gender categorization"],"prefix":"10.1109","author":[{"given":"Daniel","family":"Muller","sequence":"first","affiliation":[]},{"given":"Yiea-Funk","family":"Te","sequence":"additional","affiliation":[]},{"given":"Pratiksha","family":"Jain","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1016\/j.archger.2014.04.004"},{"journal-title":"Does the Cream Always Rise to the Top? The Misallocation of Talent in Innovation","year":"2015","author":"celik","key":"ref38"},{"key":"ref33","first-page":"9","author":"goldstone","year":"2017","journal-title":"The Quiet Transformations of Literary Studies What Thirteen Thousand Scholars Could Tell Us Welcome to Project MUSE Connect with Project MUSE"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.4236\/jilsa.2012.43017"},{"key":"ref31","first-page":"1","author":"interface","year":"2017","journal-title":"MRC Psycholinguistic Database"},{"key":"ref30","first-page":"151","author":"hu","year":"2007","journal-title":"Demographic Prediction Based on User's Browsing Behavior"},{"key":"ref37","first-page":"283","author":"jones","year":"2017","journal-title":"The Burden of Knowledge and the 'Death of the Renaissance Man' Is Innovation Getting Harder?"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.techfore.2013.08.023"},{"key":"ref35","first-page":"9","volume":"13","author":"tannen","year":"2017","journal-title":"Gender differences in topical coherence Creating involvement in best friends' talk"},{"key":"ref34","first-page":"507","article-title":"Explorations in Economic History Inventing social capital: Evidence from African American inventors, 1843&#x2013;1930 *,'","volume":"48","author":"cook","year":"2011","journal-title":"YEXEH"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.bushor.2017.01.002"},{"key":"ref40","first-page":"1","author":"sugimoto","year":"2015","journal-title":"The Academic Advantage Gender Disparities in Patenting"},{"key":"ref11","first-page":"1","article-title":"Jane, John &#x2026; Leslie? A Historical Method for Algorithmic Gender","volume":"9","author":"blevins","year":"2015","journal-title":"Prediction &#x201C;Digit Humanit Q &#x201D;"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.5334\/dsj-2015-002"},{"key":"ref13","first-page":"103","volume":"40","author":"strong","year":"0","journal-title":"Data Quality in Context"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/j.cities.2013.11.006"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.respol.2012.11.004"},{"key":"ref16","first-page":"1","author":"milli","year":"2016","journal-title":"The gender patenting gap"},{"key":"ref17","first-page":"149","volume":"24","author":"simkins-bullock","year":"1991","journal-title":"An Investigation into the Relationships Between Gender and Language"},{"journal-title":"Wand Yair Wang Richard Y","year":"1996","author":"data","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1057\/palgrave.dbm.3240247"},{"key":"ref28","first-page":"1","article-title":"Improving Data Cleaning Quality using a Data Lineage Facility","author":"shasha","year":"1996","journal-title":"Informatica"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/69.404034"},{"key":"ref27","first-page":"191","article-title":"Understanding customer relationship management (CRM): People, process and technology","volume":"21","author":"chen","year":"2017","journal-title":"Bus Process Manag J"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/269012.269021"},{"key":"ref6","article-title":"Record Linkage: Current Practice and Future Directions","author":"gu","year":"2003","journal-title":"Tech Rep"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/505248.506010"},{"journal-title":"Data Quality","year":"2000","author":"orr","key":"ref5"},{"key":"ref8","first-page":"1","article-title":"How Companies Learn Your Secrets","author":"duhigg","year":"2012","journal-title":"N Y Times Magazine"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-006-0032-0"},{"key":"ref2","first-page":"1","article-title":"Data Quality Considerations for Big Data and Machine Learning: Going Beyond Data Cleaning and Transformations","volume":"10","author":"gudivada","year":"2017","journal-title":"Int J Adv Software"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2014.6816764"},{"key":"ref1","first-page":"1","article-title":"A formal definition of data quality problems","author":"oliveira","year":"2005","journal-title":"2005 Int Conf Inf Qual"},{"key":"ref20","first-page":"1625","article-title":"Handling Missing Values when Applying Classification Models","volume":"8","author":"saar-tsechansky","year":"2007","journal-title":"J Mach Learn Res"},{"key":"ref22","volume":"3367","author":"darley","year":"2017","journal-title":"Gender Differences in Information Processing Strategies An Empirical Test of the Selectivity Model in Advertising Response Gender"},{"key":"ref21","first-page":"1","volume":"3","author":"argamon","year":"2017","journal-title":"DHQ Digital Humanities Quarterly Vive la Diff&#x00E9;rence! Text Mining Gender Difference in French Literature"},{"journal-title":"Cambia","article-title":"Lens patent database","year":"2017","key":"ref42"},{"journal-title":"Gender Differences in Internet Use Patterns and Internet Application Preferences A Two-Sample Comparison","year":"2015","author":"selfie-promotion","key":"ref24"},{"journal-title":"The Statisticain","article-title":"Share of patent applicants that were female in Swizerland from 1980 to 2013 Statista Accounts","year":"2017","key":"ref41"},{"journal-title":"Global Consumer Attitudes Towards Online Shopping","year":"0","author":"shopping","key":"ref23"},{"key":"ref44","article-title":"Federal Statistical Office-Look for Statistics","author":"federal","year":"2017","journal-title":"J Offic Statist"},{"key":"ref26","first-page":"219","author":"sattler","year":"2001","journal-title":"based on a Multidatabase Language"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1098\/rsos.140216"},{"journal-title":"Gender-Based Differences in the Effect of Web Advertising in E-business","year":"2000","author":"xue-wui","key":"ref25"}],"event":{"name":"2017 IEEE International Conference on Big Data (Big Data)","start":{"date-parts":[[2017,12,11]]},"location":"Boston, MA","end":{"date-parts":[[2017,12,14]]}},"container-title":["2017 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8241556\/8257893\/08258223.pdf?arnumber=8258223","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2018,2,19]],"date-time":"2018-02-19T18:58:16Z","timestamp":1519066696000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/8258223\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,12]]},"references-count":44,"URL":"https:\/\/doi.org\/10.1109\/bigdata.2017.8258223","relation":{},"subject":[],"published":{"date-parts":[[2017,12]]}}}