{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T07:29:37Z","timestamp":1773214177797,"version":"3.50.1"},"reference-count":28,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,1,27]],"date-time":"2026-01-27T00:00:00Z","timestamp":1769472000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,27]],"date-time":"2026-01-27T00:00:00Z","timestamp":1769472000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Comput Stat"],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1007\/s00180-025-01702-6","type":"journal-article","created":{"date-parts":[[2026,1,27]],"date-time":"2026-01-27T13:44:09Z","timestamp":1769521449000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Refitted cross-validation estimation for high-dimensional subsamples from low-dimension full data"],"prefix":"10.1007","volume":"41","author":[{"given":"Haixiang","family":"Zhang","sequence":"first","affiliation":[]},{"given":"HaiYing","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,27]]},"reference":[{"key":"1702_CR1","doi-asserted-by":"publisher","first-page":"1348","DOI":"10.1198\/016214501753382273","volume":"96","author":"J Fan","year":"2001","unstructured":"Fan J, Li R (2001) Variable selection via nonconcave penalized likelihood and its oracle properties. J Am Stat Assoc 96:1348\u20131360","journal-title":"J Am Stat Assoc"},{"key":"1702_CR2","first-page":"1","volume":"22","author":"Z Fei","year":"2021","unstructured":"Fei Z, Li Y (2021) Estimation and inference for high dimensional generalized linear models: A splitting and smoothing approach. J Mach Learn Res 22:1\u201332","journal-title":"J Mach Learn Res"},{"key":"1702_CR3","doi-asserted-by":"publisher","first-page":"551","DOI":"10.1111\/biom.13013","volume":"75","author":"Z Fei","year":"2019","unstructured":"Fei Z, Zhu J, Banerjee M, Li Y (2019) Drawing inferences for high-dimensional linear models: A selection-assisted partial regression and smoothing approach. Biometrics 75:551\u2013561","journal-title":"Biometrics"},{"key":"1702_CR4","doi-asserted-by":"publisher","first-page":"898","DOI":"10.1080\/01621459.2021.1957900","volume":"118","author":"Z Fei","year":"2023","unstructured":"Fei Z, Zheng Q, Hong H, Li Y (2023) Inference for high-dimensional censored quantile regression. J Am Stat Assoc 118:898\u2013912","journal-title":"J Am Stat Assoc"},{"key":"1702_CR5","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1007\/s11425-022-2057-8","volume":"67","author":"J Gao","year":"2024","unstructured":"Gao J, Wang L, Lian H (2024) Optimal decorrelated score subsampling for generalized linear models with massive data. Science China Math 67:405\u2013430","journal-title":"Science China Math"},{"key":"1702_CR6","unstructured":"Han H, Fu L (2023) Optimal subsampling algorithm for the marginal model with large longitudinal data. arXiv:2311.08812v1"},{"key":"1702_CR7","doi-asserted-by":"publisher","first-page":"1770","DOI":"10.1214\/19-AOS1867","volume":"48","author":"L Han","year":"2020","unstructured":"Han L, Tan KM, Yang T, Zhang T (2020) Local uncertainty sampling for large-scale multiclass logistic regression. Ann Stat 48:1770\u20131788","journal-title":"Ann Stat"},{"key":"1702_CR8","doi-asserted-by":"publisher","first-page":"672","DOI":"10.1198\/016214508000000184","volume":"103","author":"BA Johnson","year":"2008","unstructured":"Johnson BA, Lin DY, Zeng D (2008) Penalized estimating functions and variable selection in semiparametric regression models. J Am Stat Assoc 103:672\u2013680","journal-title":"J Am Stat Assoc"},{"key":"1702_CR9","doi-asserted-by":"publisher","first-page":"2262","DOI":"10.1080\/01621459.2023.2209349","volume":"118","author":"N Keret","year":"2023","unstructured":"Keret N, Gorfine M (2023) Analyzing big EHR data-optimal cox regression subsampling procedure with rare events. J Am Stat Assoc 118:2262\u20132275","journal-title":"J Am Stat Assoc"},{"key":"1702_CR10","first-page":"861","volume":"16","author":"P Ma","year":"2015","unstructured":"Ma P, Mahoney MW, Yu B (2015) A statistical perspective on algorithmic leveraging. J Mach Learn Res 16:861\u2013911","journal-title":"J Mach Learn Res"},{"key":"1702_CR11","first-page":"1","volume":"20","author":"H Wang","year":"2019","unstructured":"Wang H (2019) More efficient estimation for logistic regression with optimal subsamples. J Mach Learn Res 20:1\u201359","journal-title":"J Mach Learn Res"},{"key":"1702_CR12","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1093\/biomet\/asaa043","volume":"108","author":"H Wang","year":"2021","unstructured":"Wang H, Ma Y (2021) Optimal subsampling for quantile regression in big data. Biometrika 108:99\u2013112","journal-title":"Biometrika"},{"key":"1702_CR13","doi-asserted-by":"publisher","first-page":"418","DOI":"10.1111\/stan.12266","volume":"76","author":"T Wang","year":"2022","unstructured":"Wang T, Zhang H (2022) Optimal subsampling for multiplicative regression with massive data. Stat Neerl 76:418\u2013449","journal-title":"Stat Neerl"},{"key":"1702_CR14","doi-asserted-by":"publisher","first-page":"829","DOI":"10.1080\/01621459.2017.1292914","volume":"113","author":"H Wang","year":"2018","unstructured":"Wang H, Zhu R, Ma P (2018) Optimal subsampling for large sample logistic regression. J Am Stat Assoc 113:829\u2013844","journal-title":"J Am Stat Assoc"},{"issue":"525","key":"1702_CR15","doi-asserted-by":"publisher","first-page":"393","DOI":"10.1080\/01621459.2017.1408468","volume":"114","author":"H Wang","year":"2019","unstructured":"Wang H, Yang M, Stufken J (2019) Information-based optimal subdata selection for big data linear regression. J Am Stat Assoc 114(525):393\u2013405","journal-title":"J Am Stat Assoc"},{"key":"1702_CR16","doi-asserted-by":"publisher","first-page":"6605","DOI":"10.1109\/TIT.2022.3176955","volume":"68","author":"J Wang","year":"2022","unstructured":"Wang J, Zou J, Wang H (2022) Sampling with replacement vs poisson sampling: a comparative study in optimal subsampling. IEEE Trans Inf Theory 68:6605\u20136630","journal-title":"IEEE Trans Inf Theory"},{"key":"1702_CR17","doi-asserted-by":"publisher","first-page":"98384","DOI":"10.52202\/079017-3122","volume":"37","author":"J Wang","year":"2024","unstructured":"Wang J, Wang H, Zhang H (2024) Scale-invariant optimal sampling for rare-events data and sparse models. Adv Neural Inf Process Syst 37:98384\u201398418","journal-title":"Adv Neural Inf Process Syst"},{"key":"1702_CR18","doi-asserted-by":"publisher","first-page":"5421","DOI":"10.1002\/sim.9576","volume":"41","author":"Z Yang","year":"2022","unstructured":"Yang Z, Wang H, Yan J (2022) Optimal subsampling for parametric accelerated failure time models with massive survival data. Stat Med 41:5421\u20135431","journal-title":"Stat Med"},{"key":"1702_CR19","doi-asserted-by":"publisher","DOI":"10.1007\/s11222-024-10391-y","author":"Z Yang","year":"2024","unstructured":"Yang Z, Wang H, Yan J (2024) Subsampling approach for least squares fitting of semi-parametric accelerated failure time models to massive survival data. Stat Comput. https:\/\/doi.org\/10.1007\/s11222-024-10391-y","journal-title":"Stat Comput"},{"key":"1702_CR20","doi-asserted-by":"publisher","first-page":"151","DOI":"10.6339\/21-JDS999","volume":"19","author":"Y Yao","year":"2021","unstructured":"Yao Y, Wang H (2021) A review on optimal subsampling methods for massive datasets. J Data Sci 19:151\u2013172","journal-title":"J Data Sci"},{"key":"1702_CR21","doi-asserted-by":"publisher","first-page":"265","DOI":"10.1080\/01621459.2020.1773832","volume":"117","author":"J Yu","year":"2022","unstructured":"Yu J, Wang H, Ai M, Zhang H (2022) Optimal distributed subsampling for maximum quasi-likelihood estimators with massive data. J Am Stat Assoc 117:265\u2013276","journal-title":"J Am Stat Assoc"},{"key":"1702_CR22","doi-asserted-by":"publisher","DOI":"10.1007\/s00362-022-01386-w","author":"J Yu","year":"2023","unstructured":"Yu J, Ai M, Ye Z (2023) A review on design inspired subsampling for big data. Stat Pap. https:\/\/doi.org\/10.1007\/s00362-022-01386-w","journal-title":"Stat Pap"},{"key":"1702_CR23","doi-asserted-by":"publisher","DOI":"10.1016\/j.csda.2020.107072","volume":"153","author":"H Zhang","year":"2021","unstructured":"Zhang H, Wang H (2021) Distributed subdata selection for big data via sampling-based approach. Comput Stat Data Anal 153:107072","journal-title":"Comput Stat Data Anal"},{"key":"1702_CR24","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1080\/10618600.2020.1778483","volume":"30","author":"T Zhang","year":"2021","unstructured":"Zhang T, Ning Y, Ruppert D (2021) Optimal sampling for generalized linear models under measurement constraints. J Comput Graph Stat 30:106\u2013114","journal-title":"J Comput Graph Stat"},{"key":"1702_CR25","doi-asserted-by":"publisher","first-page":"276","DOI":"10.1080\/10618600.2023.2216261","volume":"33","author":"H Zhang","year":"2024","unstructured":"Zhang H, Zuo L, Wang H, Sun L (2024) Approximating partial likelihood estimators via optimal subsampling. J Comput Graph Stat 33:276\u2013288","journal-title":"J Comput Graph Stat"},{"key":"1702_CR26","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1515\/ijb-2024-0042","volume":"21","author":"H Zhang","year":"2025","unstructured":"Zhang H, Li Y, Wang H (2025) DsubCox: a fast subsampling algorithm for cox model with distributed and massive survival data. Int J Biostat 21:53\u201365","journal-title":"Int J Biostat"},{"key":"1702_CR27","doi-asserted-by":"publisher","first-page":"441","DOI":"10.1002\/sim.8783","volume":"40","author":"L Zuo","year":"2021","unstructured":"Zuo L, Zhang H, Wang H, Liu L (2021) Sampling-based estimation for massive survival data with additive hazards model. Stat Med 40:441\u2013450","journal-title":"Stat Med"},{"key":"1702_CR28","doi-asserted-by":"publisher","first-page":"2535","DOI":"10.1007\/s00180-021-01089-0","volume":"36","author":"L Zuo","year":"2021","unstructured":"Zuo L, Zhang H, Wang H, Sun L (2021) Optimal subsample selection for massive logistic regression with distributed data. Comput Stat 36:2535\u20132562","journal-title":"Comput Stat"}],"container-title":["Computational Statistics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00180-025-01702-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00180-025-01702-6","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00180-025-01702-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,10]],"date-time":"2026-03-10T09:39:40Z","timestamp":1773135580000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00180-025-01702-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,27]]},"references-count":28,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,2]]}},"alternative-id":["1702"],"URL":"https:\/\/doi.org\/10.1007\/s00180-025-01702-6","relation":{},"ISSN":["0943-4062","1613-9658"],"issn-type":[{"value":"0943-4062","type":"print"},{"value":"1613-9658","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,27]]},"assertion":[{"value":"21 September 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 September 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"38"}}