{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T17:53:02Z","timestamp":1743097982134,"version":"3.40.3"},"publisher-location":"Cham","reference-count":47,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031696213"},{"type":"electronic","value":"9783031696220"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-69622-0_5","type":"book-chapter","created":{"date-parts":[[2024,12,17]],"date-time":"2024-12-17T19:46:05Z","timestamp":1734464765000},"page":"83-104","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Evolution on the Generation and Analysis of Single Imputation Synthetic Datasets in Statistical Disclosure Control"],"prefix":"10.1007","author":[{"given":"Ricardo","family":"Moura","sequence":"first","affiliation":[]},{"given":"Carlos A.","family":"Coelho","sequence":"additional","affiliation":[]},{"given":"Bimal","family":"Sinha","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,12,18]]},"reference":[{"key":"5_CR1","volume-title":"Final report to the social security administration on the SIPP\/SSA\/IRS public use file project","author":"J M Abowd","year":"2006","unstructured":"Abowd, J. M., Stinson, M. H., & Benedetto, G. (2006). Final report to the social security administration on the SIPP\/SSA\/IRS public use file project. https:\/\/ecommons.cornell.edu\/items\/d7cf980e-5ec3-4322-aea2-a58b344c3ac6"},{"key":"5_CR2","unstructured":"Abowd, J., Benedetto, G., Garfinkel, S., Dahl, S., Dajani, A., Graham, M., Hawes, M., Karwa, V., Kifer, D., Kim, H., Leclerc, P., Machanavajjhala, A., Reiter, J., Rodrigues, R., Schmutte, I., Sexton, W., Singer, P., & Vilhuber, L. (2020). The modernization of statistical disclosure limitation at the U.S. Census Bureau. Working Paper Number CED-WP-2020-009."},{"issue":"4","key":"5_CR3","doi-asserted-by":"publisher","first-page":"212","DOI":"10.21307\/stattrans-2020-039","volume":"21","author":"M J Alam","year":"2020","unstructured":"Alam, M. J., Dostie, B., Drechsler, J., & Vilhuber, L. (2020). Applying data synthesis for longitudinal business data across three countries. Statistics in Transition New Series, 21(4), 212\u2013236.","journal-title":"Statistics in Transition New Series"},{"key":"5_CR4","doi-asserted-by":"publisher","first-page":"923","DOI":"10.1111\/j.1467-985X.2007.00492.x","volume":"170","author":"D An","year":"2007","unstructured":"An, D., & Little, R. J. A. (2007). Multiple imputation: An alternative to top coding for statistical disclosure control. Journal of the Royal Statistical Society, Series A, 170, 923\u2013940.","journal-title":"Journal of the Royal Statistical Society, Series A"},{"key":"5_CR5","doi-asserted-by":"crossref","unstructured":"Basak, B. and Sinha, B. (2024). Analysis of one-way anova model using synthetic data. Sankhya B, pages 1\u201327.","DOI":"10.1007\/s13571-023-00318-4"},{"key":"5_CR6","doi-asserted-by":"crossref","unstructured":"Bowen, C. M., Bryant, V., Burman, L., Khitatrakun, S., McClelland, R., Stallworth, P., Ueyama, K., & Williams, A. R. (2020). A synthetic supplemental public use file of low-income information return data: Methodology, utility, and privacy implications. In Privacy in statistical databases: UNESCO chair in data privacy, international conference, PSD 2020, Tarragona, Spain, September 23\u201325, 2020, Proceedings (pp. 257\u2013270). Springer International Publishing.","DOI":"10.1007\/978-3-030-57521-2_18"},{"issue":"1","key":"5_CR7","first-page":"27","volume":"3","author":"G Caiola","year":"2010","unstructured":"Caiola, G., & Reiter, J. P. (2010). Random forests for generating partially synthetic, categorical data. Transactions on Data Privacy, 3(1), 27\u201342.","journal-title":"Transactions on Data Privacy"},{"key":"5_CR8","series-title":"In Privacy in statistical databases: UNESCO chair in data privacy, international conference, PSD 2010, Corfu, Greece, September 22\u201324, 2010. Proceedings (pp. 148\u2013161)","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-15838-4_14","volume-title":"Using support vector machines for generating synthetic datasets","author":"J Drechsler","year":"2010","unstructured":"Drechsler, J. (2010). Using support vector machines for generating synthetic datasets. In Privacy in statistical databases: UNESCO chair in data privacy, international conference, PSD 2010, Corfu, Greece, September 22\u201324, 2010. Proceedings (pp. 148\u2013161). Springer Berlin Heidelberg."},{"key":"5_CR9","doi-asserted-by":"crossref","unstructured":"Drechsler, J. (2011). Synthetic datasets for statistical disclosure control: Theory and implementation (Vol. 201). Springer Science & Business Media.","DOI":"10.1007\/978-1-4614-0326-5"},{"key":"5_CR10","volume":"2304","author":"J Drechsler","year":"2023","unstructured":"Drechsler, J., & Haensch, A. C. (2023). 30 years of synthetic data. Preprint, arXiv:2304.02107.","journal-title":"Preprint, arXiv"},{"issue":"2","key":"5_CR11","first-page":"25","volume":"22","author":"A Guin","year":"2022","unstructured":"Guin, A., Roy, A., & Sinha, B. (2022). Bayesian analysis of multiply imputed synthetic data under the multiple linear regression model. International Journal of Statistical Sciences, 22(2), 25\u201338.","journal-title":"International Journal of Statistical Sciences"},{"issue":"2","key":"5_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.3329\/ijss.v23i2.70112","volume":"23","author":"A Guin","year":"2023","unstructured":"Guin, A., Roy, A., & Sinha, B. (2023). Bayesian analysis of singly imputed synthetic data under the multivariate normal model. International Journal of Statistical Sciences, 23(2), 1\u201318.","journal-title":"International Journal of Statistical Sciences"},{"key":"5_CR13","unstructured":"Hundepool, A., Domingo-Ferrer, J., Franconi, L., Giessing, S., Lenz, R., Longhurst, J., Nordholt, E. S., Seri, G., & Wolf, P. (2010). Handbook on statistical disclosure control. ESSnet on Statistical Disclosure Control. https:\/\/cros.ec.europa.eu\/system\/files\/2023-12\/SDC_Handbook.pdf"},{"key":"5_CR14","first-page":"248","volume":"1997","author":"A B Kennickell","year":"1997","unstructured":"Kennickell, A. B. (1997). Multiple imputation and disclosure protection: The case of the 1995 survey of consumer finances. Record Linkage Techniques, 1997, 248\u2013267.","journal-title":"Record Linkage Techniques"},{"issue":"3","key":"5_CR15","doi-asserted-by":"publisher","first-page":"362","DOI":"10.1111\/j.1751-5823.2011.00153.x","volume":"79","author":"S K Kinney","year":"2011","unstructured":"Kinney, S. K., Reiter, J. P., Reznek, A. P., Miranda, J., Jarmin, R. S., & Abowd, J. M. (2011). Towards unrestricted public use business microdata: The synthetic longitudinal business database. International Statistical Review, 79(3), 362\u2013384.","journal-title":"International Statistical Review"},{"key":"5_CR16","doi-asserted-by":"crossref","unstructured":"Kinney, S. K., Reiter, J. P., & Miranda, J. (2014). Improving the synthetic longitudinal business database. US Census Bureau Center for Economic Studies.","DOI":"10.2139\/ssrn.2423400"},{"key":"5_CR17","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1007\/s13571-015-0100-8","volume":"77","author":"M Klein","year":"2015","unstructured":"Klein, M., & Sinha, B. (2015a). Inference for singly imputed synthetic data based on posterior predictive sampling under multivariate normal and multiple linear regression models. Sankhya B, 77, 293\u2013311.","journal-title":"Sankhya B"},{"issue":"1","key":"5_CR18","doi-asserted-by":"publisher","first-page":"43","DOI":"10.29012\/jpc.v7i1.645","volume":"7","author":"M Klein","year":"2015","unstructured":"Klein, M., & Sinha, B. (2015b). Likelihood based finite sample inference for singly imputed synthetic data under the multivariate normal and multiple linear regression models. Journal of Privacy and Confidentiality, 7(1), 43\u201398.","journal-title":"Journal of Privacy and Confidentiality"},{"issue":"1","key":"5_CR19","first-page":"33","volume":"13","author":"M Klein","year":"2015","unstructured":"Klein, M., & Sinha, B. (2015c). Likelihood-based finite sample inference for synthetic data based on exponential model. Thailand Statistician, 13(1), 33\u201347.","journal-title":"Thailand Statistician"},{"key":"5_CR20","doi-asserted-by":"publisher","first-page":"168","DOI":"10.1016\/j.spl.2015.06.003","volume":"105","author":"M Klein","year":"2015","unstructured":"Klein, M., & Sinha, B. (2015d). Likelihood-based inference for singly and multiply imputed synthetic data under a normal model. Statistics & Probability Letters, 105, 168\u2013175.","journal-title":"Statistics & Probability Letters"},{"key":"5_CR21","doi-asserted-by":"publisher","first-page":"100","DOI":"10.1080\/15598608.2017.1350606","volume":"12","author":"M D Klein","year":"2018","unstructured":"Klein, M. D., & and Datta, G. S. (2018). Statistical disclosure control via sufficiency under the multiple linear regression model. Journal of Statistical Theory and Practice, 12, 100\u2013110.","journal-title":"Journal of Statistical Theory and Practice"},{"key":"5_CR22","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1007\/s13571-019-00215-9","volume":"83","author":"M Klein","year":"2021","unstructured":"Klein, M., Moura, R., & Sinha, B. (2021). Multivariate normal inference based on singly imputed synthetic data under plug-in sampling. Sankhya B, 83, 273\u2013287.","journal-title":"Sankhya B"},{"issue":"11","key":"5_CR23","doi-asserted-by":"publisher","first-page":"1667","DOI":"10.1093\/jamia\/ocaa127","volume":"27","author":"A Koivu","year":"2020","unstructured":"Koivu, A., Sairanen, M., Airola, A., & Pahikkala, T. (2020). Synthetic minority oversampling of vital statistics data with generative adversarial networks. Journal of the American Medical Informatics Association, 27(11), 1667\u20131674.","journal-title":"Journal of the American Medical Informatics Association"},{"key":"5_CR24","first-page":"407","volume":"9","author":"R J A Little","year":"1993","unstructured":"Little, R. J. A. (1993). Statistical analysis of masked data. Journal of Official Statistics, 9, 407\u2013426.","journal-title":"Journal of Official Statistics"},{"key":"5_CR25","first-page":"11237","volume":"33","author":"C Ma","year":"2020","unstructured":"Ma, C., Tschiatschek, S., Turner, R., Hern\u00e1ndez-Lobato, J. M., & Zhang, C. (2020). Vaem: A deep generative model for heterogeneous mixed type data. Advances in Neural Information Processing Systems, 33, 11237\u201311247.","journal-title":"Advances in Neural Information Processing Systems"},{"issue":"5","key":"5_CR26","first-page":"655","volume":"20","author":"N Mishra","year":"2022","unstructured":"Mishra, N., & Barui, S. (2022). Likelihood-based finite sample inference for synthetic data from pareto model. REVSTAT-Statistical Journal, 20(5), 655\u2013676.","journal-title":"REVSTAT-Statistical Journal"},{"key":"5_CR27","unstructured":"Moura, R. P. (2016). Likelihood-based inference for multivariate regression models using synthetic data. Ph.D. Thesis, Universidade NOVA de Lisboa, Portugal."},{"issue":"2","key":"5_CR28","first-page":"155","volume":"15","author":"R Moura","year":"2017","unstructured":"Moura, R., Klein, M., Coelho, C. A., & Sinha, B. (2017). Inference for multivariate regression model based on synthetic data generated under fixed-posterior predictive sampling. REVSTAT: Statistical Journal, 15(2), 155\u2013186.","journal-title":"REVSTAT: Statistical Journal"},{"issue":"534","key":"5_CR29","doi-asserted-by":"publisher","first-page":"720","DOI":"10.1080\/01621459.2021.1900860","volume":"116","author":"R Moura","year":"2021","unstructured":"Moura, R., Klein, M., Zylstra, J., Coelho, C. A., & Sinha, B. (2021). Inference for multivariate regression model based on synthetic data generated using plug-in sampling. Journal of the American Statistical Association, 116(534), 720\u2013733.","journal-title":"Journal of the American Statistical Association"},{"key":"5_CR30","doi-asserted-by":"crossref","unstructured":"Moura, R., Norouzirad, M., & Mazarei, D. (2023). Psinference: Inference for released plug-in sampling single synthetic dataset. Computer software. https:\/\/github.com\/ricardomourarpm\/PSinference.","DOI":"10.32614\/CRAN.package.PSinference"},{"issue":"10","key":"5_CR31","doi-asserted-by":"publisher","first-page":"1071","DOI":"10.14778\/3231751.3231757","volume":"11","author":"N Park","year":"2018","unstructured":"Park, N., Mohammadi, M., Gorde, K., Jajodia, S., Park, H., & Kim, Y. (2018). Data synthesis based on generative adversarial networks. Proceedings of the VLDB Endowment, 11(10), 1071\u20131083.","journal-title":"Proceedings of the VLDB Endowment"},{"issue":"3","key":"5_CR32","doi-asserted-by":"publisher","first-page":"67","DOI":"10.29012\/jpc.v7i3.407","volume":"7","author":"G M Raab","year":"2018","unstructured":"Raab, G. M., Nowok, B., & Dibben, C. (2018). Practical data synthesis for large samples. Journal of Privacy and Confidentiality, 7(3), 67\u201397.","journal-title":"Journal of Privacy and Confidentiality"},{"issue":"1","key":"5_CR33","first-page":"85","volume":"27","author":"T E Raghunathan","year":"2001","unstructured":"Raghunathan, T. E., Lepkowski, J. M., Van Hoewyk, J., Solenberger, P., et al. (2001). A multivariate technique for multiply imputing missing values using a sequence of regression models. Survey Methodology, 27(1), 85\u201396.","journal-title":"Survey Methodology"},{"key":"5_CR34","first-page":"1","volume":"19","author":"T E Raghunathan","year":"2003","unstructured":"Raghunathan, T. E., Reiter, J. P., & Rubin, D. B. (2003). Multiple imputation for statistical disclosure limitation. Journal of Official Statistics, 19, 1\u201316.","journal-title":"Journal of Official Statistics"},{"issue":"4","key":"5_CR35","first-page":"531","volume":"18","author":"J P Reiter","year":"2002","unstructured":"Reiter, J. P. (2002). Satisfying disclosure restrictions with synthetic data sets. Journal of Official Statistics, 18(4), 531.","journal-title":"Journal of Official Statistics"},{"key":"5_CR36","first-page":"181","volume":"29","author":"J P Reiter","year":"2003","unstructured":"Reiter, J. P. (2003). Inference for partially synthetic, public use microdata sets. Survey Methodology, 29, 181\u2013188.","journal-title":"Survey Methodology"},{"issue":"1","key":"5_CR37","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1111\/j.1467-985X.2004.00343.x","volume":"168","author":"J P Reiter","year":"2005","unstructured":"Reiter, J. P. (2005a). Releasing multiply imputed, synthetic public use microdata: An illustration and empirical study. Journal of the Royal Statistical Society: Series A (Statistics in Society), 168(1), 185\u2013205.","journal-title":"Journal of the Royal Statistical Society: Series A (Statistics in Society)"},{"issue":"2","key":"5_CR38","doi-asserted-by":"publisher","first-page":"365","DOI":"10.1016\/j.jspi.2004.02.003","volume":"131","author":"J P Reiter","year":"2005","unstructured":"Reiter, J. P. (2005b). Significance tests for multi-component estimands from multiply imputed, synthetic microdata. Journal of Statistical Planning and Inference, 131(2), 365\u2013377.","journal-title":"Journal of Statistical Planning and Inference"},{"issue":"3","key":"5_CR39","first-page":"441","volume":"21","author":"J P Reiter","year":"2005","unstructured":"Reiter, J. P. (2005c). Using CART to generate partially synthetic public use microdata. Journal of Official Statistics, 21(3), 441\u2013462.","journal-title":"Journal of Official Statistics"},{"issue":"4","key":"5_CR40","first-page":"583","volume":"28","author":"J P Reiter","year":"2012","unstructured":"Reiter, J. P., & Kinney, S. K. (2012). Inferentially valid, partially synthetic data: Generating from posterior predictive distributions not necessary. Journal of Official Statistics, 28(4), 583.","journal-title":"Journal of Official Statistics"},{"key":"5_CR41","doi-asserted-by":"crossref","unstructured":"Reiter, J. P., & Raghunathan, T. E. (2007). The multiple adaptations of multiple imputation. Journal of the American Statistical Association, 1462\u20131471.","DOI":"10.1198\/016214507000000932"},{"key":"5_CR42","doi-asserted-by":"crossref","unstructured":"Reiter, J. P., Wang, Q., & Zhang, B. (2014). Bayesian estimation of disclosure risks for multiply imputed, synthetic data. Journal of Privacy and Confidentiality, 6(1).","DOI":"10.29012\/jpc.v6i1.635"},{"key":"5_CR43","doi-asserted-by":"publisher","DOI":"10.1002\/9780470316696","volume-title":"Multiple imputation for nonresponse in surveys","author":"D B Rubin","year":"1987","unstructured":"Rubin, D. B. (1987). Multiple imputation for nonresponse in surveys. Wiley."},{"key":"5_CR44","first-page":"461","volume":"9","author":"D B Rubin","year":"1993","unstructured":"Rubin, D. B. (1993). Discussion: Statistical disclosure limitation. Journal of Official Statistics, 9, 461\u2013468.","journal-title":"Journal of Official Statistics"},{"key":"5_CR45","unstructured":"Srivastava, A., Valkov, L., Russell, C., Gutmann, M. U., & Sutton, C. (2017). Veegan: Reducing mode collapse in gans using implicit variational learning. Advances in Neural Information Processing Systems, 30."},{"key":"5_CR46","unstructured":"Vardhan, L. V. H., & Kok, S. (2020). Generating privacy-preserving synthetic tabular data using oblivious variational autoencoders. In Proceedings of the workshop on economics of privacy and data labor at the 37th international conference on machine learning (ICML)."},{"key":"5_CR47","unstructured":"Xu, L., Skoularidou, M., Cuesta-Infante, A., & Veeramachaneni, K. (2019). Modeling tabular data using conditional GAN. In Advances in neural information processing systems (Vol. 32). Curran Associates, Inc."}],"container-title":["Emerging Topics in Statistics and Biostatistics","Statistical Modeling and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-69622-0_5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,17]],"date-time":"2024-12-17T20:02:10Z","timestamp":1734465730000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-69622-0_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031696213","9783031696220"],"references-count":47,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-69622-0_5","relation":{},"ISSN":["2524-7735","2524-7743"],"issn-type":[{"type":"print","value":"2524-7735"},{"type":"electronic","value":"2524-7743"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"18 December 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}