{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,11]],"date-time":"2025-12-11T20:18:48Z","timestamp":1765484328958,"version":"3.37.3"},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2022,12,30]],"date-time":"2022-12-30T00:00:00Z","timestamp":1672358400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,12,30]],"date-time":"2022-12-30T00:00:00Z","timestamp":1672358400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100010909","name":"Young Scientists Fund","doi-asserted-by":"publisher","award":["11901573"],"award-info":[{"award-number":["11901573"]}],"id":[{"id":"10.13039\/501100010909","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Comput Stat"],"published-print":{"date-parts":[[2024,4]]},"DOI":"10.1007\/s00180-022-01319-z","type":"journal-article","created":{"date-parts":[[2022,12,30]],"date-time":"2022-12-30T05:02:38Z","timestamp":1672376558000},"page":"709-732","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Deterministic subsampling for logistic regression with massive data"],"prefix":"10.1007","volume":"39","author":[{"given":"Yan","family":"Song","sequence":"first","affiliation":[]},{"given":"Wenlin","family":"Dai","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,12,30]]},"reference":[{"issue":"2","key":"1319_CR1","first-page":"749","volume":"31","author":"M Ai","year":"2021","unstructured":"Ai M, Yu J, Zhang H, Wang H (2021) Optimal subsampling algorithms for big data regressions. Stat Sin 31(2):749\u2013772","journal-title":"Stat Sin"},{"key":"1319_CR2","doi-asserted-by":"publisher","DOI":"10.1093\/oso\/9780199296590.001.0001","volume-title":"Optimum experimental designs, with SAS","author":"A Atkinson","year":"2007","unstructured":"Atkinson A, Donev A, Tobias R (2007) Optimum experimental designs, with SAS. Oxford University Press, New York"},{"key":"1319_CR3","doi-asserted-by":"publisher","first-page":"4308","DOI":"10.1038\/ncomms5308","volume":"5","author":"P Baldi","year":"2014","unstructured":"Baldi P, Sadowski P, Whiteson D (2014) Searching for exotic particles in high-energy physics with deep learning. Nat Commun 5:4308","journal-title":"Nat Commun"},{"issue":"1","key":"1319_CR4","doi-asserted-by":"publisher","first-page":"348","DOI":"10.1137\/19M1261717","volume":"58","author":"B Bercu","year":"2020","unstructured":"Bercu B, Godichon A, Portier B (2020) An efficient stochastic Newton algorithm for parameter estimation in logistic regressions. SIAM J Control Optim 58(1):348\u2013367","journal-title":"SIAM J Control Optim"},{"key":"1319_CR5","unstructured":"Besanson G (2015) FastKNN: fast k-nearest neighbors. R package version 0.0.1"},{"issue":"1","key":"1319_CR6","first-page":"3","volume":"1","author":"A Beygelzimer","year":"2019","unstructured":"Beygelzimer A, Kakadet S, Langford J, Arya S, Mount D, Li S (2019) FNN: fast nearest neighbor search algorithms and applications. R Package Version 1(1):3","journal-title":"R Package Version"},{"key":"1319_CR7","unstructured":"Chau H, Kirkby J, Nguyen D, Nguyen D, Nguyen N, Nguyen T (2022) On the inversion-free Newton\u2019s method and its applications. Working paper"},{"key":"1319_CR8","doi-asserted-by":"publisher","first-page":"112","DOI":"10.1016\/j.jspi.2020.03.004","volume":"209","author":"Q Cheng","year":"2020","unstructured":"Cheng Q, Wang H, Yang M (2020) Information-based optimal subdata selection for big data logistic regression. J Stat Plan Inference 209:112\u2013122","journal-title":"J Stat Plan Inference"},{"key":"1319_CR9","doi-asserted-by":"publisher","first-page":"310","DOI":"10.1051\/ps\/2018021","volume":"23","author":"S Cl\u00e9men\u00e7on","year":"2019","unstructured":"Cl\u00e9men\u00e7on S, Bertail P, Chautru E, Papa G (2019) Optimal survey schemes for stochastic gradient descent with applications to m-estimation. ESAIM Prob Stat 23:310\u2013337","journal-title":"ESAIM Prob Stat"},{"issue":"4","key":"1319_CR10","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1080\/00401706.1980.10486199","volume":"22","author":"RD Cook","year":"1980","unstructured":"Cook RD, Weisberg S (1980) Characterizations of an empirical influence function for detecting influential cases in regression. Technometrics 22(4):495\u2013508","journal-title":"Technometrics"},{"key":"1319_CR11","unstructured":"Davison AC (2003a) Likelihood. Cambridge Series in Statistical and Probabilistic Mathematics. Cambridge University Press, pp 94\u2013160"},{"key":"1319_CR12","doi-asserted-by":"crossref","unstructured":"Davison AC (2003b) Nonlinear regression models. Cambridge Series in Statistical and Probabilistic Mathematics. Cambridge University Press, pp 468\u2013564","DOI":"10.1017\/CBO9780511815850.011"},{"issue":"2","key":"1319_CR13","doi-asserted-by":"publisher","first-page":"219","DOI":"10.1007\/s00211-010-0331-6","volume":"117","author":"P Drineas","year":"2011","unstructured":"Drineas P, Mahoney MW, Muthukrishnan S, Sarl\u00f3s T (2011) Faster least squares approximation. Numer Math 117(2):219\u2013249","journal-title":"Numer Math"},{"issue":"1","key":"1319_CR14","first-page":"2","volume":"3","author":"J Elseberg","year":"2012","unstructured":"Elseberg J, Magnenat S, Siegwart R, N\u00fcchter A (2012) Comparison of nearest-neighbor-search strategies and implementations for efficient shape registration. J Softw Eng Robot (JOSER) 3(1):2\u201312","journal-title":"J Softw Eng Robot (JOSER)"},{"issue":"5","key":"1319_CR15","doi-asserted-by":"publisher","first-page":"1724","DOI":"10.1214\/14-AOS1220","volume":"42","author":"W Fithian","year":"2014","unstructured":"Fithian W, Hastie T (2014) Local case-control sampling: efficient subsampling in imbalanced data sets. Ann Stat 42(5):1724\u20131963","journal-title":"Ann Stat"},{"key":"1319_CR16","doi-asserted-by":"crossref","unstructured":"Gama J, Rocha R, Medas P (2003) Accurate decision trees for mining high-speed data streams. In: Proceedings of the ninth ACM SIGKDD international conference on knowledge discovery and data mining, KDD \u201903, New York, pp 523\u2013528. Association for Computing Machinery","DOI":"10.1145\/956804.956813"},{"issue":"3","key":"1319_CR17","doi-asserted-by":"publisher","first-page":"1770","DOI":"10.1214\/19-AOS1867","volume":"48","author":"L Han","year":"2020","unstructured":"Han L, Yang T, Zhang T (2020) Local uncertainty sampling for large-scale multi-class logistic regression. Ann Stat 48(3):1770\u20131788","journal-title":"Ann Stat"},{"issue":"3","key":"1319_CR18","doi-asserted-by":"publisher","first-page":"943","DOI":"10.1007\/s00362-021-01263-y","volume":"63","author":"JL Kirkby","year":"2022","unstructured":"Kirkby JL, Nguyen DH, Nguyen D, Nguyen NN (2022) Inversion-free subsampling Newton\u2019s method for large sample logistic regression. Stat Pap 63(3):943\u2013963","journal-title":"Stat Pap"},{"issue":"1","key":"1319_CR21","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1002\/wics.1324","volume":"7","author":"P Ma","year":"2015","unstructured":"Ma P, Sun X (2015) Leveraging for big data regression. Wiley Interdiscip Rev Comput Stat 7(1):70\u201376","journal-title":"Wiley Interdiscip Rev Comput Stat"},{"issue":"3","key":"1319_CR19","doi-asserted-by":"publisher","first-page":"631","DOI":"10.1093\/biomet\/asv009","volume":"102","author":"P Ma","year":"2015","unstructured":"Ma P, Huang JZ, Zhang N (2015a) Efficient computation of smoothing splines via adaptive basis sampling. Biometrika 102(3):631\u2013645","journal-title":"Biometrika"},{"issue":"1","key":"1319_CR20","first-page":"861","volume":"16","author":"P Ma","year":"2015","unstructured":"Ma P, Mahoney MW, Yu B (2015b) A statistical perspective on algorithmic leveraging. J Mach Learn Res 16(1):861\u2013911","journal-title":"J Mach Learn Res"},{"key":"1319_CR22","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4899-3242-6","volume-title":"Generalized linear models","author":"P McCullagh","year":"1989","unstructured":"McCullagh P, Nelder JA (1989) Generalized linear models, 2nd edn. Chapman & Hall, London","edition":"2"},{"issue":"3","key":"1319_CR23","doi-asserted-by":"publisher","first-page":"723","DOI":"10.1093\/biomet\/asaa019","volume":"107","author":"C Meng","year":"2020","unstructured":"Meng C, Zhang X, Zhang J, Zhong W, Ma P (2020) More efficient approximation of smoothing splines via space-filling basis selection. Biometrika 107(3):723\u2013735","journal-title":"Biometrika"},{"key":"1319_CR24","doi-asserted-by":"crossref","unstructured":"Oza NC, Russell S (2001) Experimental comparisons of online and batch versions of bagging and boosting. In: Proceedings of the seventh ACM SIGKDD international conference on knowledge discovery and data mining, KDD \u201901, New York. Association for Computing Machinery, pp 359\u2013364","DOI":"10.1145\/502512.502565"},{"issue":"4","key":"1319_CR25","doi-asserted-by":"publisher","first-page":"705","DOI":"10.1214\/aos\/1176345513","volume":"9","author":"D Pregibon","year":"1981","unstructured":"Pregibon D (1981) Logistic regression diagnostics. Ann Stat 9(4):705\u2013724","journal-title":"Ann Stat"},{"issue":"213","key":"1319_CR26","first-page":"1","volume":"17","author":"G Raskutti","year":"2016","unstructured":"Raskutti G, Mahoney MW (2016) A statistical perspective on randomized sketching for ordinary least-squares. J Mach Learn Res 17(213):1\u201331","journal-title":"J Mach Learn Res"},{"key":"1319_CR27","unstructured":"Settles B (2009) Active learning literature survey. Technical report, University of Wisconsin-Madison"},{"key":"1319_CR28","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1093\/biomet\/80.1.99","volume":"80","author":"R St Laurent","year":"1993","unstructured":"St Laurent R, Cook R (1993) Leverage, local influence and curvature in nonlinear regression. Biometrika 80:99\u2013106","journal-title":"Biometrika"},{"key":"1319_CR29","unstructured":"Ting D, Brochu E (2018) Optimal subsampling with influence functions. In: Proceedings of the 32nd international conference on neural information processing systems, pp 3654\u20133663"},{"issue":"132","key":"1319_CR30","first-page":"1","volume":"20","author":"H Wang","year":"2019","unstructured":"Wang H (2019) More efficient estimation for logistic regression with optimal subsamples. J Mach Learn Res 20(132):1\u201359","journal-title":"J Mach Learn Res"},{"key":"1319_CR31","unstructured":"Wang H (2020) Logistic regression for massive data with rare events. In: The 37st international conference on machine learning (ICML-2020). Accepted"},{"issue":"1","key":"1319_CR32","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1093\/biomet\/asaa043","volume":"108","author":"H Wang","year":"2020","unstructured":"Wang H, Ma Y (2020) Optimal subsampling for quantile regression in big data. Biometrika 108(1):99\u2013112","journal-title":"Biometrika"},{"issue":"522","key":"1319_CR34","doi-asserted-by":"publisher","first-page":"829","DOI":"10.1080\/01621459.2017.1292914","volume":"113","author":"H Wang","year":"2018","unstructured":"Wang H, Zhu R, Ma P (2018) Optimal subsampling for large sample logistic regression. J Am Stat Assoc 113(522):829\u2013844","journal-title":"J Am Stat Assoc"},{"issue":"525","key":"1319_CR33","doi-asserted-by":"publisher","first-page":"393","DOI":"10.1080\/01621459.2017.1408468","volume":"114","author":"H Wang","year":"2019","unstructured":"Wang H, Yang M, Stufken J (2019) Information-based optimal subdata selection for big data linear regression. J Am Stat Assoc 114(525):393\u2013405","journal-title":"J Am Stat Assoc"},{"issue":"3","key":"1319_CR35","doi-asserted-by":"publisher","first-page":"1273","DOI":"10.1214\/21-AOAS1462","volume":"15","author":"L Wang","year":"2021","unstructured":"Wang L, Elmstedt J, Wong WK, Xu H (2021) Orthogonal subsampling for big data linear regression. Ann Appl Stat 15(3):1273\u20131290","journal-title":"Ann Appl Stat"},{"issue":"1","key":"1319_CR36","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1111\/1467-9469.00086","volume":"25","author":"B-C Wei","year":"2001","unstructured":"Wei B-C, Hu Y-Q, Fung W-K (2001) Generalized leverage and its applications. Scand J Stat 25(1):25\u201337","journal-title":"Scand J Stat"},{"issue":"3","key":"1319_CR37","doi-asserted-by":"publisher","first-page":"991","DOI":"10.1214\/16-AOS1472","volume":"45","author":"Y Yang","year":"2017","unstructured":"Yang Y, Pilanci M, Wainwright M (2017) Randomized sketches for kernels: Fast and optimal non-parametric regression. Ann Stat 45(3):991\u20131023","journal-title":"Ann Stat"},{"issue":"1","key":"1319_CR38","doi-asserted-by":"publisher","first-page":"585","DOI":"10.1007\/s00362-018-01068-6","volume":"60","author":"Y Yao","year":"2019","unstructured":"Yao Y, Wang H (2019) Optimal subsampling for softmax regression. Stat Pap 60(1):585\u2013599","journal-title":"Stat Pap"}],"container-title":["Computational Statistics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00180-022-01319-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00180-022-01319-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00180-022-01319-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,14]],"date-time":"2024-03-14T09:08:26Z","timestamp":1710407306000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00180-022-01319-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,12,30]]},"references-count":38,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2024,4]]}},"alternative-id":["1319"],"URL":"https:\/\/doi.org\/10.1007\/s00180-022-01319-z","relation":{},"ISSN":["0943-4062","1613-9658"],"issn-type":[{"type":"print","value":"0943-4062"},{"type":"electronic","value":"1613-9658"}],"subject":[],"published":{"date-parts":[[2022,12,30]]},"assertion":[{"value":"11 May 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 December 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 December 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}