{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T14:45:32Z","timestamp":1740149132574,"version":"3.37.3"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2024,3,8]],"date-time":"2024-03-08T00:00:00Z","timestamp":1709856000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,3,8]],"date-time":"2024-03-08T00:00:00Z","timestamp":1709856000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"NSF Idaho EPSCoR Program","award":["OIA1757324"],"award-info":[{"award-number":["OIA1757324"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["42202333"],"award-info":[{"award-number":["42202333"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Earth Sci Inform"],"published-print":{"date-parts":[[2024,6]]},"DOI":"10.1007\/s12145-024-01268-9","type":"journal-article","created":{"date-parts":[[2024,3,8]],"date-time":"2024-03-08T11:01:38Z","timestamp":1709895698000},"page":"1983-1991","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["How does extreme point sampling affect non-extreme simulation in geographical random forest?"],"prefix":"10.1007","volume":"17","author":[{"given":"Hui","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Meixu","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhe","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Li","family":"Huang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christopher C.","family":"Caudill","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shijin","family":"Qu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiang","family":"Que","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,3,8]]},"reference":[{"key":"1268_CR1","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1016\/j.isprsjprs.2016.01.011","volume":"114","author":"M Belgiu","year":"2016","unstructured":"Belgiu M, Dr\u0103gu\u0163 L (2016) Random forest in remote sensing: a review of applications and future directions. ISPRS J Photogrammetry Remote Sens 114:24\u201331","journal-title":"ISPRS J Photogrammetry Remote Sens"},{"key":"1268_CR2","unstructured":"Berry BJL, Marble DF (1968) Spatial analysis: a reader in statistical geography. Prentice-Hall"},{"issue":"3","key":"1268_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3381028","volume":"53","author":"A Boukerche","year":"2020","unstructured":"Boukerche A, Zheng L, Alfandi O (2020) Outlier detection: methods, models, and classification. ACM Comput Surv (CSUR) 53(3):1\u201337","journal-title":"ACM Comput Surv (CSUR)"},{"issue":"3","key":"1268_CR4","first-page":"431","volume":"47","author":"C Brunsdon","year":"1998","unstructured":"Brunsdon C, Fotheringham S, Charlton M (1998) Geographically weighted regression. J Royal Stat Society: Ser D 47(3):431\u2013443","journal-title":"J Royal Stat Society: Ser D"},{"issue":"1\u20132","key":"1268_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/S0016-7061(97)00072-4","volume":"80","author":"D Brus","year":"1997","unstructured":"Brus D, De Gruijter J (1997) Random sampling or geostatistical modelling? Choosing between design-based and model-based sampling strategies for soil (with discussion). Geoderma 80(1\u20132):1\u201344","journal-title":"Geoderma"},{"issue":"1","key":"1268_CR6","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1007\/s10107-012-0572-5","volume":"134","author":"RH Byrd","year":"2012","unstructured":"Byrd RH, Chin GM, Nocedal J, Wu Y (2012) Sample size selection in optimization methods for machine learning. Math Program 134(1):127\u2013155","journal-title":"Math Program"},{"issue":"4","key":"1268_CR7","doi-asserted-by":"publisher","first-page":"488","DOI":"10.1214\/aoms\/1177729747","volume":"21","author":"WJ Dixon","year":"1950","unstructured":"Dixon WJ (1950) Analysis of extreme values. Ann Math Stat 21(4):488\u2013506","journal-title":"Ann Math Stat"},{"issue":"9","key":"1268_CR8","doi-asserted-by":"publisher","first-page":"2018","DOI":"10.1111\/2041-210X.13919","volume":"13","author":"M Dumelle","year":"2022","unstructured":"Dumelle M, Higham M, Ver Hoef JM, Olsen AR, Madsen L (2022) A comparison of design-based and model\u2010based approaches for finite population spatial sampling and inference. Methods Ecol Evol 13(9):2018\u20132029","journal-title":"Methods Ecol Evol"},{"issue":"4","key":"1268_CR9","first-page":"585","volume":"42","author":"R Dunn","year":"1993","unstructured":"Dunn R, Harrison A (1993) Two-dimensional systematic sampling of land use. J Royal Stat Society: Ser C 42(4):585\u2013601","journal-title":"J Royal Stat Society: Ser C"},{"issue":"1","key":"1268_CR10","doi-asserted-by":"publisher","first-page":"83","DOI":"10.3390\/rs5010083","volume":"5","author":"N Flood","year":"2013","unstructured":"Flood N, Danaher T, Gill T, Gillingham S (2013) An operational scheme for deriving standardised surface reflectance from Landsat TM\/ETM\u2009+\u2009and SPOT HRG imagery for Eastern Australia. Remote Sens 5(1):83\u2013109","journal-title":"Remote Sens"},{"issue":"2","key":"1268_CR11","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1080\/10106049.2019.1595177","volume":"36","author":"S Georganos","year":"2021","unstructured":"Georganos S, Grippa T, Niang Gadiaga A, Linard C, Lennert M, Vanhuysse S, Kalogirou S (2021) Geographical random forests: a spatial extension of the random forest algorithm to address spatial heterogeneity in remote sensing and population modelling. Geocarto Int 36(2):121\u2013136","journal-title":"Geocarto Int"},{"key":"1268_CR12","doi-asserted-by":"publisher","first-page":"717","DOI":"10.1007\/s10798-012-9212-x","volume":"23","author":"SM G\u00f3mez Puente","year":"2013","unstructured":"G\u00f3mez Puente SM, Van Eijck M, Jochems W (2013) A sampled literature review of design-based learning approaches: a search for key characteristics. Int J Technol Des Educ 23:717\u2013732","journal-title":"Int J Technol Des Educ"},{"issue":"10","key":"1268_CR13","doi-asserted-by":"publisher","first-page":"1429","DOI":"10.1139\/x98-166","volume":"28","author":"TG Gregoire","year":"1998","unstructured":"Gregoire TG (1998) Design-based and model-based inference in survey sampling: appreciating the difference. Can J for Res 28(10):1429\u20131447","journal-title":"Can J for Res"},{"key":"1268_CR14","unstructured":"James R, Knaub J (1999) Model-based sampling, inference and imputation"},{"key":"1268_CR15","doi-asserted-by":"crossref","unstructured":"Kalogirou S, Georganos S (2018) Spatial Machine Learning (Version 0.1.3) [Package]","DOI":"10.32614\/CRAN.package.SpatialML"},{"issue":"4","key":"1268_CR16","doi-asserted-by":"publisher","first-page":"407","DOI":"10.4097\/kjae.2017.70.4.407","volume":"70","author":"SK Kwak","year":"2017","unstructured":"Kwak SK, Kim JH (2017) Statistical data preparation: management of missing values and outliers. Korean J Anesthesiology 70(4):407","journal-title":"Korean J Anesthesiology"},{"key":"1268_CR17","doi-asserted-by":"crossref","unstructured":"Masud MM, Gao J, Khan L, Han J, Thuraisingham B (2008) A practical approach to classify evolving data streams: Training with limited amount of labeled data Paper presented at the 2008 Eighth IEEE International Conference on Data Mining","DOI":"10.1109\/ICDM.2008.152"},{"issue":"7","key":"1268_CR18","doi-asserted-by":"publisher","first-page":"8489","DOI":"10.3390\/rs70708489","volume":"7","author":"K Millard","year":"2015","unstructured":"Millard K, Richardson M (2015) On the importance of training data sample selection in random forest image classification: a case study in peatland ecosystem mapping. Remote Sens 7(7):8489\u20138515","journal-title":"Remote Sens"},{"issue":"1","key":"1268_CR19","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1016\/0034-4257(94)00073-V","volume":"51","author":"R Myneni","year":"1995","unstructured":"Myneni R, Maggion S, Iaquinta J, Privette J, Gobron N, Pinty B, Williams D (1995a) Optical remote sensing of vegetation: modeling, caveats, and algorithms. Remote Sens Environ 51(1):169\u2013188","journal-title":"Remote Sens Environ"},{"issue":"2","key":"1268_CR20","doi-asserted-by":"publisher","first-page":"481","DOI":"10.1109\/TGRS.1995.8746029","volume":"33","author":"RB Myneni","year":"1995","unstructured":"Myneni RB, Hall FG, Sellers PJ, Marshak AL (1995b) The interpretation of spectral vegetation indexes. IEEE Trans Geoscience Remote Sens 33(2):481\u2013486","journal-title":"IEEE Trans Geoscience Remote Sens"},{"issue":"2","key":"1268_CR21","doi-asserted-by":"publisher","first-page":"290","DOI":"10.1080\/15598608.2017.1353456","volume":"12","author":"A Sayed","year":"2018","unstructured":"Sayed A, Ibrahim A (2018) Recent developments in systematic sampling: a review. J Stat Theory Pract 12(2):290\u2013310","journal-title":"J Stat Theory Pract"},{"key":"1268_CR22","doi-asserted-by":"crossref","unstructured":"U\u00e7ar MK, Nour M, Sindi H, Polat K (2020) The effect of training and testing process on machine learning in biomedical datasets. Mathematical Problems in Engineering, 2020","DOI":"10.1155\/2020\/2836236"},{"issue":"11","key":"1268_CR23","doi-asserted-by":"publisher","first-page":"e0224365","DOI":"10.1371\/journal.pone.0224365","volume":"14","author":"A Vabalas","year":"2019","unstructured":"Vabalas A, Gowen E, Poliakoff E, Casson AJ (2019) Machine learning algorithm validation with a limited sample size. PLoS ONE 14(11):e0224365","journal-title":"PLoS ONE"},{"key":"1268_CR24","doi-asserted-by":"publisher","first-page":"103359","DOI":"10.1016\/j.earscirev.2020.103359","volume":"210","author":"AM-C Wadoux","year":"2020","unstructured":"Wadoux AM-C, Minasny B, McBratney AB (2020) Machine learning for digital soil mapping: applications, challenges and suggested solutions. Earth Sci Rev 210:103359","journal-title":"Earth Sci Rev"},{"issue":"1","key":"1268_CR28","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1111\/j.1467-9671.1997.tb00003.x","volume":"2","author":"J Wang","year":"1997","unstructured":"Wang J, Wise S, Haining R (1997) An integrated regionalization of earthquake, flood, and drought hazards in China. Trans GIS 2(1):25\u201344","journal-title":"Trans GIS"},{"issue":"4","key":"1268_CR27","doi-asserted-by":"publisher","first-page":"523","DOI":"10.1080\/13658810902873512","volume":"24","author":"J Wang","year":"2010","unstructured":"Wang J, Haining R, Cao Z (2010) Sample surveying to estimate the mean of a heterogeneous surface: reducing the error variance through zoning. Int J Geogr Inf Sci 24(4):523\u2013543","journal-title":"Int J Geogr Inf Sci"},{"key":"1268_CR26","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.spasta.2012.08.001","volume":"2","author":"J-F Wang","year":"2012","unstructured":"Wang J-F, Stein A, Gao B-B, Ge Y (2012) A review of spatial sampling. Spat Stat 2:1\u201314","journal-title":"Spat Stat"},{"key":"1268_CR25","doi-asserted-by":"publisher","first-page":"102353","DOI":"10.1016\/j.jag.2021.102353","volume":"101","author":"H Wang","year":"2021","unstructured":"Wang H, Seaborn T, Wang Z, Caudill CC, Link TE (2021) Modeling tree canopy height using machine learning over mixed vegetation landscapes. Int J Appl Earth Observation Geoinf 101:102353","journal-title":"Int J Appl Earth Observation Geoinf"},{"issue":"5","key":"1268_CR29","doi-asserted-by":"publisher","first-page":"575","DOI":"10.3390\/rs11050575","volume":"11","author":"A Zafari","year":"2019","unstructured":"Zafari A, Zurita-Milla R, Izquierdo-Verdiguier E (2019) Evaluating the performance of a random forest kernel for land cover classification. Remote Sens 11(5):575","journal-title":"Remote Sens"},{"key":"1268_CR30","doi-asserted-by":"publisher","first-page":"112723","DOI":"10.1016\/j.rse.2021.112723","volume":"267","author":"Y Zeng","year":"2021","unstructured":"Zeng Y, Hao D, Badgley G, Damm A, Rascher U, Ryu Y, Qiu H (2021) Estimating near-infrared reflectance of vegetation from hyperspectral data. Remote Sens Environ 267:112723","journal-title":"Remote Sens Environ"}],"container-title":["Earth Science Informatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12145-024-01268-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s12145-024-01268-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12145-024-01268-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,14]],"date-time":"2024-11-14T00:45:39Z","timestamp":1731545139000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s12145-024-01268-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,8]]},"references-count":30,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,6]]}},"alternative-id":["1268"],"URL":"https:\/\/doi.org\/10.1007\/s12145-024-01268-9","relation":{},"ISSN":["1865-0473","1865-0481"],"issn-type":[{"type":"print","value":"1865-0473"},{"type":"electronic","value":"1865-0481"}],"subject":[],"published":{"date-parts":[[2024,3,8]]},"assertion":[{"value":"24 November 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 March 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 March 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}