{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,5]],"date-time":"2026-02-05T20:44:28Z","timestamp":1770324268523,"version":"3.49.0"},"reference-count":126,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2020,4,1]],"date-time":"2020-04-01T00:00:00Z","timestamp":1585699200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,4,1]],"date-time":"2020-04-01T00:00:00Z","timestamp":1585699200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"name":"TATA Trust Grant to CMI","award":["NA"],"award-info":[{"award-number":["NA"]}]},{"name":"Commonwealth Fellowship","award":["RF 2017-123"],"award-info":[{"award-number":["RF 2017-123"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Comput Stat"],"published-print":{"date-parts":[[2020,9]]},"DOI":"10.1007\/s00180-020-00970-8","type":"journal-article","created":{"date-parts":[[2020,4,1]],"date-time":"2020-04-01T09:02:49Z","timestamp":1585731769000},"page":"893-930","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":21,"title":["A Bayesian perspective of statistical machine learning for big data"],"prefix":"10.1007","volume":"35","author":[{"given":"Rajiv","family":"Sambasivan","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5354-6520","authenticated-orcid":false,"given":"Sourish","family":"Das","sequence":"additional","affiliation":[]},{"given":"Sujit K.","family":"Sahu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,4,1]]},"reference":[{"key":"970_CR1","doi-asserted-by":"crossref","first-page":"87","DOI":"10.1016\/j.bdr.2015.04.001","volume":"2","author":"OY Al-Jarrah","year":"2015","unstructured":"Al-Jarrah OY, Yoo PD, Muhaidat S, Karagiannidis GK, Taha K (2015) Efficient machine learning for Big Data: a review. Big Data Res 2:87\u201393","journal-title":"Big Data Res"},{"key":"970_CR2","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1023\/A:1020281327116","volume":"50","author":"C Andrieu","year":"2003","unstructured":"Andrieu C, De Freitas N, Doucet A, Jordan MI (2003) An introduction to MCMC for machine learning. Mach Learn 50:5\u201343","journal-title":"Mach Learn"},{"key":"970_CR3","series-title":"Springer series in statistics","volume-title":"Statistical decision theory and Bayesian analysis","author":"JO Berger","year":"1993","unstructured":"Berger JO (1993) Statistical decision theory and Bayesian analysis, 2nd edn. Springer series in statistics. Springer, New York","edition":"2"},{"key":"970_CR4","volume-title":"Sequential Analysis","author":"JO Berger","year":"2017","unstructured":"Berger JO (2017) Sequential Analysis, vol 1\u20133. Palgrave Macmillan UK, London"},{"key":"970_CR5","first-page":"281","volume":"13","author":"J Bergstra","year":"2012","unstructured":"Bergstra J, Bengio Y (2012) Random search for hyper-parameter optimization. J Mach Learn Res 13:281\u2013305","journal-title":"J Mach Learn Res"},{"key":"970_CR6","doi-asserted-by":"crossref","first-page":"813","DOI":"10.1214\/15-AOS1388","volume":"44","author":"D Bertsimas","year":"2016","unstructured":"Bertsimas D, King A, Mazumder R (2016) Best subset selection via a modern optimization lens. Ann Stat 44:813\u2013852","journal-title":"Ann Stat"},{"key":"970_CR7","doi-asserted-by":"crossref","first-page":"859","DOI":"10.1080\/01621459.2017.1285773","volume":"112","author":"DM Blei","year":"2017","unstructured":"Blei DM, Kucukelbir A, McAuliffe JD (2017) Variational inference: a review for statisticians. J Am Stat Assoc 112:859\u2013877","journal-title":"J Am Stat Assoc"},{"key":"970_CR8","doi-asserted-by":"crossref","first-page":"223","DOI":"10.1137\/16M1080173","volume":"60","author":"L Bottou","year":"2018","unstructured":"Bottou L, Curtis FE, Nocedal J (2018) Optimization methods for large-scale machine learning. SIAM Rev 60:223\u2013311","journal-title":"SIAM Rev"},{"key":"970_CR9","doi-asserted-by":"crossref","first-page":"169","DOI":"10.1007\/978-3-540-28650-9_8","volume-title":"Advanced lectures on machine learning","author":"O Bousquet","year":"2004","unstructured":"Bousquet O, Boucheron S, Lugosi G (2004) Introduction to statistical learning theory. Advanced lectures on machine learning. Springer, New York, pp 169\u2013207"},{"key":"970_CR10","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511804441","volume-title":"Convex optimization","author":"S Boyd","year":"2004","unstructured":"Boyd S, Vandenberghe L (2004) Convex optimization. Cambridge University Press, Cambridge"},{"key":"970_CR11","first-page":"123","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L (1996) Bagging predictors. Mach Learn 24:123\u2013140","journal-title":"Mach Learn"},{"key":"970_CR12","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001a) Random forests. Mach Learn 45:5\u201332","journal-title":"Mach Learn"},{"key":"970_CR13","doi-asserted-by":"crossref","first-page":"199","DOI":"10.1214\/ss\/1009213726","volume":"16","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001b) Statistical modeling: the two cultures (with comments and a rejoinder by the author). Stat Sci 16:199\u2013231","journal-title":"Stat Sci"},{"key":"970_CR14","volume-title":"Classification and regression trees","author":"L Breiman","year":"1984","unstructured":"Breiman L, Friedman J, Stone CJ, Olshen RA (1984) Classification and regression trees. CRC Press, Boca Raton"},{"key":"970_CR15","unstructured":"Castro R (2018a) 2DI70 - Statistical learning theory, lecture notes. http:\/\/www.win.tue.nl\/~rmcastro\/2DI70\/files\/2DI70_Lecture_Notes.pdf. Accessed 8 Oct 2019"},{"key":"970_CR16","unstructured":"Castro R (2018b) ELEN6887: Complexity regularization and the squared loss. http:\/\/www.win.tue.nl\/~rmcastro\/6887_10\/files\/lecture11.pdf. Accessed 8 Oct 2019"},{"key":"970_CR17","volume-title":"Semi supervised learning","author":"O Chapelle","year":"2010","unstructured":"Chapelle O, Scholkopf B, Zien A (2010) Semi supervised learning, vol 1. The MIT Press, Cambridge"},{"key":"970_CR18","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C (2016) XGBoost: a scalable tree boosting system. In: Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining. ACM, pp 785\u2013794","DOI":"10.1145\/2939672.2939785"},{"key":"970_CR19","doi-asserted-by":"crossref","unstructured":"Chen Z, Hruschka E, Liu B (2016) Lifelong machine learning and computer reading the web. In: Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining. ACM, pp 2117\u20132118","DOI":"10.1145\/2939672.2945381"},{"key":"970_CR20","unstructured":"Chipman HA, George EI, McCulloch RE (2006) Bayesian ensemble learning. In: Proceedings of the 19th international conference on neural information processing systems. NIPS\u201906. MIT Press, Cambridge, pp 265\u2013272"},{"key":"970_CR21","volume-title":"Introduction to algorithms","author":"TH Cormen","year":"2009","unstructured":"Cormen TH, Leiserson CE, Rivest RL, Stein C (2009) Introduction to algorithms, 3rd edn. McGraw-Hill, New York","edition":"3"},{"key":"970_CR22","first-page":"265","volume":"60","author":"S Das","year":"2006","unstructured":"Das S, Dey D (2006) On Bayesian analysis of generalized linear models using Jacobian technique. Am Stat 60:265\u2013268","journal-title":"Am Stat"},{"key":"970_CR23","doi-asserted-by":"crossref","first-page":"1492","DOI":"10.1016\/j.spl.2010.05.018","volume":"80","author":"S Das","year":"2010","unstructured":"Das S, Dey D (2010) On Bayesian inference for generalized multivariate gamma distribution. Stat Probab Lett 80:1492\u20131499","journal-title":"Stat Probab Lett"},{"key":"970_CR24","doi-asserted-by":"crossref","first-page":"407","DOI":"10.1007\/s11009-011-9255-6","volume":"15","author":"S Das","year":"2013","unstructured":"Das S, Dey D (2013) On dynamic generalized linear models with applications. Methodol Comput Appl Probab 15:407\u2013421","journal-title":"Methodol Comput Appl Probab"},{"key":"970_CR25","doi-asserted-by":"crossref","first-page":"12","DOI":"10.1016\/j.bdr.2018.06.002","volume":"14","author":"S Das","year":"2018","unstructured":"Das S, Roy S, Sambasivan R (2018) Fast gaussian process regression for big data. Big Data Res 14:12\u201326","journal-title":"Big Data Res"},{"key":"970_CR26","first-page":"2151","volume":"4","author":"S Das","year":"2012","unstructured":"Das S, Yang H, Banks D (2012) Synthetic priors that merge opinion from multiple experts. Stat Polit Policy 4:2151\u20137509","journal-title":"Stat Polit Policy"},{"key":"970_CR27","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean J, Ghemawat S (2008) MapReduce: simplified data processing on large clusters. Commun ACM 51:107\u2013113","journal-title":"Commun ACM"},{"key":"970_CR28","unstructured":"Dheeru D, Karra Taniskidou E (2017) UCI machine learning repository, individual household electric power consumption data set. https:\/\/archive.ics.uci.edu\/ml\/machine-learning-databases\/00235\/. Accessed 8 Oct 2019"},{"key":"970_CR29","doi-asserted-by":"crossref","first-page":"78","DOI":"10.1145\/2347736.2347755","volume":"55","author":"P Domingos","year":"2012","unstructured":"Domingos P (2012) A few useful things to know about machine learning. Commun ACM 55:78\u201387","journal-title":"Commun ACM"},{"key":"970_CR30","unstructured":"Duvenaud D (2014) Automatic model construction with gaussian processes. University of Cambridge, Computational and Biological Learning Laboratory, PhD thesis"},{"key":"970_CR31","unstructured":"ForestScience (1998) Forest CoverType Dataset by Forest Science Department of Colorado State University. https:\/\/archive.ics.uci.edu\/ml\/datasets\/covertype Data downloaded from UCI Machine Learning Repository. Accessed 8 Oct 2019"},{"key":"970_CR32","doi-asserted-by":"crossref","unstructured":"Foroughi F, Luksch P (2018) Data science methodology for Cybersecurity Projects. ArXiv preprint arXiv:1803.04219","DOI":"10.5121\/csit.2018.80401"},{"key":"970_CR33","first-page":"3","volume":"29","author":"JH Friedman","year":"1998","unstructured":"Friedman JH (1998) Data mining and statistics: What\u2019s the connection? Comput Sci Stat 29:3\u20139","journal-title":"Comput Sci Stat"},{"key":"970_CR34","series-title":"Springer series in statistics","volume-title":"The elements of statistical learning","author":"J Friedman","year":"2009","unstructured":"Friedman J, Hastie T, Tibshirani R (2009) The elements of statistical learning, 2nd edn. Springer series in statistics. Springer, New York","edition":"2"},{"key":"970_CR35","unstructured":"Gammerman A, Vovk V, Vapnik V (1998) Learning by transduction. In: Proceedings of the Fourteenth conference on Uncertainty in artificial intelligence. Morgan Kaufmann Publishers Inc, Burlington, pp 148\u2013155"},{"key":"970_CR36","doi-asserted-by":"crossref","first-page":"501","DOI":"10.1111\/j.2517-6161.1994.tb01996.x","volume":"56","author":"AE Gelfand","year":"1994","unstructured":"Gelfand AE, Dey DK (1994) Bayesian model choice: asymptotics and exact calculations. J R Stat Soc Ser B (Methodological) 56:501\u2013514","journal-title":"J R Stat Soc Ser B (Methodological)"},{"key":"970_CR37","doi-asserted-by":"crossref","first-page":"398","DOI":"10.1080\/01621459.1990.10476213","volume":"85","author":"AE Gelfand","year":"1990","unstructured":"Gelfand AE, Smith AFM (1990) Sampling-based approaches to calculating marginal densities. J Am Stat Assoc 85:398\u2013409","journal-title":"J Am Stat Assoc"},{"key":"970_CR38","doi-asserted-by":"crossref","DOI":"10.1201\/b16018","volume-title":"Bayesian data analysis","author":"A Gelman","year":"2013","unstructured":"Gelman A, Carlin JB, Stern HS, Dunson DB, Vehtari A, Rubin DB (2013) Bayesian data analysis, 3rd edn. CRC Press, Boca Raton","edition":"3"},{"key":"970_CR39","doi-asserted-by":"crossref","unstructured":"Germain P, Lacasse A, Laviolette F, Marchand M (2009) PAC-Bayesian learning of linear classifiers. In: Proceedings of the 26th international conference on machine learning (ICML), pp 353\u2013360","DOI":"10.1145\/1553374.1553419"},{"key":"970_CR40","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/j.jmp.2011.08.004","volume":"56","author":"SJ Gershman","year":"2012","unstructured":"Gershman SJ, Blei DM (2012) A tutorial on Bayesian nonparametric models. J Math Psychol 56:1\u201312","journal-title":"J Math Psychol"},{"key":"970_CR41","doi-asserted-by":"crossref","first-page":"359","DOI":"10.1561\/2200000049","volume":"8","author":"M Ghavamzadeh","year":"2015","unstructured":"Ghavamzadeh M, Mannor S, Pineau J, Tamar A (2015) Bayesian reinforcement learning: a survey. Found Trends Mach Learn 8:359\u2013483","journal-title":"Found Trends Mach Learn"},{"key":"970_CR42","doi-asserted-by":"crossref","DOI":"10.1017\/9781139029834","volume-title":"Fundamentals of nonparametric bayesian inference","author":"S Ghoshal","year":"2017","unstructured":"Ghoshal S, Vaart AVD (2017) Fundamentals of nonparametric bayesian inference. Cambridge University Press, Cambridge"},{"key":"970_CR43","unstructured":"Goodfellow I (2018) Practical methodology for deploying machine learning. https:\/\/www.youtube.com\/watch?v=NKiwFF_zBu4&t=1781s. Accessed 8 Oct 2019"},{"key":"970_CR44","unstructured":"Goodfellow I, Bengio Y, Courville A (2016) Deep learning. MIT Press http:\/\/www.deeplearningbook.org. Accessed 8 Oct 2019"},{"key":"970_CR45","unstructured":"Google Research (2019) Quantum Computing, Quantum Computing, Google Research. https:\/\/www.ibm.com\/quantum-computing\/learn\/what-is-quantum-computing\/. Accessed 8 Oct 2019"},{"key":"970_CR46","volume-title":"Machine learning: theory and applications","author":"V Govindaraju","year":"2013","unstructured":"Govindaraju V, Rao CR (2013) Machine learning: theory and applications. Elsevier, North Holland"},{"key":"970_CR47","doi-asserted-by":"crossref","unstructured":"Guillaumin M, Verbeek J, Schmid C (2010) Multimodal semi-supervised learning for image classification. In: 2010 IEEE computer society conference on computer vision and pattern recognition, CVPR 2010","DOI":"10.1109\/CVPR.2010.5540120"},{"key":"970_CR48","doi-asserted-by":"crossref","first-page":"78","DOI":"10.1016\/0890-5401(92)90010-D","volume":"100","author":"D Haussler","year":"1992","unstructured":"Haussler D (1992) Decision theoretic generalizations of the PAC model for neural net and other learning applications. Inf Comput 100:78\u2013150","journal-title":"Inf Comput"},{"key":"970_CR49","doi-asserted-by":"publisher","first-page":"e1002106","DOI":"10.1371\/journal.pbio.1002106","volume":"13","author":"M Head","year":"2015","unstructured":"Head M, Holman L, Lanfear R, Kahn A, Jennions M (2015) The extent and consequences of p-hacking in science. PLOS Biol 13:e1002106. https:\/\/doi.org\/10.1371\/journal.pbio.1002106","journal-title":"PLOS Biol"},{"key":"970_CR50","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1080\/00401706.1970.10488634","volume":"12","author":"AE Hoerl","year":"1970","unstructured":"Hoerl AE, Kennard RW (1970) Ridge regression: biased estimation for nonorthogonal problems. Technometrics 12:55\u201367","journal-title":"Technometrics"},{"key":"970_CR51","doi-asserted-by":"crossref","first-page":"331","DOI":"10.1007\/978-3-662-43968-5_19","volume-title":"Interactive knowledge discovery and data mining in biomedical informatics","author":"A Holzinger","year":"2014","unstructured":"Holzinger A (2014) On topological data mining. Interactive knowledge discovery and data mining in biomedical informatics. Springer, New York, pp 331\u2013356"},{"key":"970_CR52","unstructured":"IBM Q (2019) Quantum computing. https:\/\/www.ibm.com\/quantum-computing\/learn\/what-is-quantum-computing\/. Accessed 8 Oct 2019"},{"key":"970_CR53","volume-title":"Data lake architecture: designing the data lake and avoiding the garbage dump","author":"B Inmon","year":"2016","unstructured":"Inmon B (2016) Data lake architecture: designing the data lake and avoiding the garbage dump. Technics Publications, New Jersy"},{"key":"970_CR54","doi-asserted-by":"crossref","first-page":"142","DOI":"10.1561\/2200000058","volume":"10","author":"P Jain","year":"2017","unstructured":"Jain P, Kar P (2017) Non-convex optimization for machine learning. Found Trends Mach Learn 10:142\u2013336","journal-title":"Found Trends Mach Learn"},{"key":"970_CR55","unstructured":"Joachims T (1999) Transductive inference for text classification using support vector machines. In: Proceedings of the 16th international conference on machine learning, ICML 99, pp 200\u2013209"},{"key":"970_CR56","unstructured":"Kadane JB, Wasilkowski GW (1983) Average case-complexity in computer science: a Bayesian view. Technical Report"},{"key":"970_CR57","doi-asserted-by":"crossref","first-page":"3724","DOI":"10.1109\/TSP.2018.2839583","volume":"66","author":"A Karbalayghareh","year":"2018","unstructured":"Karbalayghareh A, Qian X, Dougherty ER (2018) Optimal Bayesian transfer learning. IEEE Trans Signal Process 66:3724\u20133739","journal-title":"IEEE Trans Signal Process"},{"key":"970_CR58","unstructured":"Kendall A, Gal Y (2017) What uncertainties do we need in bayesian deep learning for computer vision? In: 31st conference on neural information processing systems, NIPS 2017"},{"key":"970_CR59","volume-title":"The data warehouse lifecycle toolkit: expert methods for designing, developing, and deploying data warehouses","author":"R Kimball","year":"2013","unstructured":"Kimball R (2013) The data warehouse lifecycle toolkit: expert methods for designing, developing, and deploying data warehouses, 3rd edn. Wiley, New York","edition":"3"},{"key":"970_CR60","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4614-6849-3","volume-title":"Applied predictive modeling","author":"M Kuhn","year":"2013","unstructured":"Kuhn M, Johnson K (2013) Applied predictive modeling. Springer, New York"},{"key":"970_CR61","volume-title":"Discovering knowledge in data: an introduction to data mining","author":"DT Larose","year":"2005","unstructured":"Larose DT (2005) Discovering knowledge in data: an introduction to data mining. Wiley, New Jersey"},{"key":"970_CR62","volume-title":"Data mining methods & models","author":"DT Larose","year":"2006","unstructured":"Larose DT (2006) Data mining methods & models. Wiley, New York"},{"key":"970_CR63","first-page":"1909","volume":"7","author":"P Laskov","year":"2006","unstructured":"Laskov P, Gehl C, Kr\u00fcger S, M\u00fcller K-R (2006) Incremental support vector learning: analysis, implementation and applications. J Mach Learn Res 7:1909\u20131936","journal-title":"J Mach Learn Res"},{"key":"970_CR64","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9781139924801","volume-title":"Mining of massive datasets","author":"J Leskovec","year":"2014","unstructured":"Leskovec J, Rajaraman A, Ullman JD (2014) Mining of massive datasets, 2nd edn. Cambridge University Press, Cambridge","edition":"2"},{"key":"970_CR65","doi-asserted-by":"crossref","first-page":"7776","DOI":"10.1109\/ACCESS.2017.2696365","volume":"5","author":"A \u0139heureux","year":"2017","unstructured":"\u0139heureux A, Grolinger K, Elyamany HF, Capretz MA (2017) Machine learning with big data: challenges and approaches. IEEE Access 5:7776\u20137797","journal-title":"IEEE Access"},{"key":"970_CR66","first-page":"151","volume":"5","author":"Q Li","year":"2010","unstructured":"Li Q, Lin N (2010) The Bayesian elastic net. Bayesian Anal 5:151\u2013170","journal-title":"Bayesian Anal"},{"key":"970_CR67","unstructured":"Lichman M (2016) UCI machine learning repository. https:\/\/archive.ics.uci.edu\/ml\/machine-learning-databases\/housing\/. Accessed 8 Oct 2019"},{"key":"970_CR68","doi-asserted-by":"crossref","unstructured":"Littman ML (1994) Markov games as a framework for multi-agent reinforcement learning. In: Proceedings of the eleventh international conference, Rutgers University, New Brunswick, NJ, July 10\u201313, pp 157\u2013163","DOI":"10.1016\/B978-1-55860-335-6.50027-1"},{"key":"970_CR69","doi-asserted-by":"crossref","first-page":"716","DOI":"10.14778\/2212351.2212354","volume":"5","author":"Y Low","year":"2012","unstructured":"Low Y, Bickson D, Gonzalez J, Guestrin C, Kyrola A, Hellerstein JM (2012) Distributed GraphLab: a framework for machine learning and data mining in the cloud. Proc VLDB Endow 5:716\u2013727","journal-title":"Proc VLDB Endow"},{"key":"970_CR70","doi-asserted-by":"crossref","first-page":"163","DOI":"10.1007\/s10107-010-0350-1","volume":"131","author":"Z Lu","year":"2012","unstructured":"Lu Z, Monteiro RD, Yuan M (2012) Convex optimization methods for dimension reduction and coefficient estimation in multivariate linear regression. Math Program 131:163\u2013194","journal-title":"Math Program"},{"key":"970_CR71","first-page":"363","volume-title":"On-line learning in neural networks","author":"O Manfred","year":"1999","unstructured":"Manfred O, Ole W (1999) A Bayesian approach to on-line learning. In: Saad D (ed) On-line learning in neural networks. Cambridge University Press, Cambridge, pp 363\u2013379"},{"key":"970_CR72","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4899-3242-6","volume-title":"Generalized linear models","author":"P McCullagh","year":"1989","unstructured":"McCullagh P, Nelder J (1989) Generalized linear models, 2nd edn. Chapman and Hall\/CRC, London","edition":"2"},{"key":"970_CR73","unstructured":"McKinsey (2018) How companies are using big data and analytics, McKinsey & Company. https:\/\/www.mckinsey.com\/business-functions\/mckinsey-analytics\/our-insights\/how-companies-are-using-big-data-and-analytics. Accessed 8 Oct 2019"},{"key":"970_CR74","unstructured":"Microsoft Research (2018) Microsoft Research Lab - Asia. https:\/\/www.microsoft.com\/en-us\/research\/lab\/microsoft-research-asia\/articles\/machine-learning-research-hotspots\/. Accessed 8 Oct 2019"},{"key":"970_CR75","volume-title":"The discipline of machine learning","author":"TM Mitchell","year":"2006","unstructured":"Mitchell TM (2006) The discipline of machine learning, vol 9. Carnegie Mellon University, School of Computer Science, Machine Learning Department, Carnegie Mellon"},{"key":"970_CR76","unstructured":"National Institute of Standards and Technology - US Department of Commerce (2018) NIST Big Data Interoperability Framework: Volume 1, Definitions. http:\/\/nvlpubs.nist.gov\/nistpubs\/SpecialPublications\/NIST.SP.1500-1.pdf"},{"key":"970_CR77","volume-title":"Numerical optimization","author":"J Nocedal","year":"2006","unstructured":"Nocedal J, Wright S (2006) Numerical optimization, 2nd edn. Springer, New York","edition":"2"},{"key":"970_CR78","unstructured":"Nowak R (2018) Statistical learning theory, Lecture 3. http:\/\/nowak.ece.wisc.edu\/SLT09\/lecture3.pdf. Accessed 8 Oct 2019"},{"key":"970_CR79","doi-asserted-by":"crossref","first-page":"681","DOI":"10.1198\/016214508000000337","volume":"103","author":"T Park","year":"2008","unstructured":"Park T, Casella G (2008) The Bayesian Lasso. J Am Stat Assoc 103:681\u2013686","journal-title":"J Am Stat Assoc"},{"key":"970_CR80","unstructured":"Park S, Choi S (2010) Hierarchical Gaussian process regression. In: ACML, pp 95\u2013110"},{"key":"970_CR81","unstructured":"Pechyony D (2009) Theory and practice of transductive learning. Computer Science Department, PhD thesis, Technion"},{"key":"970_CR82","unstructured":"Pentina A, Lampert CH (2014) A PAC-Bayesian bound for lifelong learning. In: Proceedings of the 31st international conference on machine learning. ICML 14, vol 32, pp 991\u2013999"},{"key":"970_CR83","doi-asserted-by":"crossref","unstructured":"Poupart P, Vlassis N, Hoey J, Regan K (2006) An analytic solution to discrete Bayesian reinforcement learning. In: Proceedings of the 23rd international conference on Machine learning, ICML 06, pp 697\u2013704","DOI":"10.1145\/1143844.1143932"},{"key":"970_CR84","first-page":"204","volume":"5","author":"LY Pratt","year":"1992","unstructured":"Pratt LY (1992) Discriminability-based transfer between neural networks. Adv Neural Inf Process Syst 5:204\u2013211","journal-title":"Adv Neural Inf Process Syst"},{"key":"970_CR85","doi-asserted-by":"crossref","first-page":"67","DOI":"10.1186\/s13634-016-0355-x","volume":"2016","author":"J Qiu","year":"2016","unstructured":"Qiu J, Wu Q, Ding G, Xu Y, Feng S (2016) A survey of machine learning for big data processing. EURASIP J Adv Signal Process 2016:67","journal-title":"EURASIP J Adv Signal Process"},{"key":"970_CR86","doi-asserted-by":"crossref","first-page":"1297","DOI":"10.1109\/TPAMI.2014.2362751","volume":"37","author":"N Quadrianto","year":"2015","unstructured":"Quadrianto N, Ghahramani Z (2015) A very simple safe-bayesian random forest. IEEE Trans Pattern Anal Mach Intell 37:1297\u20131303","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"970_CR87","unstructured":"Rajaratnam B, Sparks D (2015) MCMC-based inference in the era of big data: a fundamental analysis of the convergence complexity of high-dimensional chains. https:\/\/arxiv.org\/abs\/1508.00947"},{"key":"970_CR88","volume-title":"Gaussian processes for machine learning","author":"CE Rasmussen","year":"2006","unstructured":"Rasmussen CE, Williams C (2006) Gaussian processes for machine learning. MIT Press, Cambridge"},{"key":"970_CR89","unstructured":"Ravi Kumar P (2014) Statistical machine learning and Big-p, Big-n, complex Data. http:\/\/uwtv.org\/series\/computer-science-engineering-lecture-series-2013\/watch\/IxNky5abdL8\/. Accessed 8 Oct 2019"},{"key":"970_CR90","doi-asserted-by":"crossref","unstructured":"Sambasivan R, Das S (2017a) Big data regression using tree based segmentation. In: Proceedings of INDICON, IEEE","DOI":"10.1109\/INDICON.2017.8488137"},{"key":"970_CR91","doi-asserted-by":"crossref","unstructured":"Sambasivan R, Das S (2017b) A statistical machine learning approach to yield curve forecasting. In: Proceedings of the international conference on computational intelligence in data science, IEEE","DOI":"10.1109\/ICCIDS.2017.8272667"},{"key":"970_CR92","doi-asserted-by":"crossref","first-page":"1","DOI":"10.2200\/S00429ED1V01Y201207AIM018","volume":"6","author":"B Settles","year":"2012","unstructured":"Settles B (2012) Active learning. Synth Lect Artif Intell Mach Learn 6:1\u2013114","journal-title":"Synth Lect Artif Intell Mach Learn"},{"key":"970_CR93","unstructured":"Shalev-Shwartz S (2007) Online learning: theory, algorithms, and applications, PhD thesis, Hebrew University"},{"key":"970_CR94","unstructured":"Shalev-Shwartz S, Singer Y (2008) Tutorial on theory and applications of online learning, Tutorial ICML"},{"key":"970_CR95","unstructured":"Sharma R, Das S (2017) Regularization and variable selection with copula prior. Corespondence https:\/\/arxiv.org\/abs\/1709.05514"},{"key":"970_CR96","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511809682","volume-title":"Kernel methods for pattern analysis","author":"J Shawe-Taylor","year":"2004","unstructured":"Shawe-Taylor J, Cristianini N (2004) Kernel methods for pattern analysis. Cambridge University Press, Cambridge"},{"key":"970_CR97","unstructured":"Shinal J (2017) Google CEO Sundar PIchai: moving all directions at once. https:\/\/www.cnbc.com\/2017\/05\/18\/google-ceo-sundar-pichai-machine-learning-big-data.html. Accessed 8 Oct 2019"},{"key":"970_CR98","doi-asserted-by":"crossref","first-page":"289","DOI":"10.1214\/10-STS330","volume":"25","author":"G Shmueli","year":"2010","unstructured":"Shmueli G (2010) To explain or to predict? Stat Sci 25:289\u2013310","journal-title":"Stat Sci"},{"key":"970_CR99","unstructured":"Silver DL, Yang Q, Li L (2013) Lifelong machine learning systems: beyond learning algorithms. In: AAAI Spring Symposium: Lifelong Machine Learning, vol 13, pp 05"},{"key":"970_CR100","unstructured":"Snell J, Swersky K, Zemel RS (2017) Prototypical networks for few-shot learning. In: Proceedings of the 31st conference on neural information processing systems, NIPS"},{"key":"970_CR101","first-page":"2951","volume":"25","author":"J Snoek","year":"2012","unstructured":"Snoek J, Larochelle H, Adams RP (2012) Practical bayesian optimization of machine learning algorithms. Adv Neural Inf Process Syst 25:2951\u20132959","journal-title":"Adv Neural Inf Process Syst"},{"key":"970_CR102","volume-title":"Introduction to reinforcement learning","author":"RS Sutton","year":"1998","unstructured":"Sutton RS, Barto AG (1998) Introduction to reinforcement learning, vol 135. MIT Press, Cambridge"},{"key":"970_CR103","unstructured":"Therneau T, Atkinson B, Ripley B (2017) rpart: Recursive Partitioning and Regression Trees R package version 4.1-11"},{"key":"970_CR104","doi-asserted-by":"crossref","first-page":"267","DOI":"10.1111\/j.2517-6161.1996.tb02080.x","volume":"58","author":"R Tibshirani","year":"1996","unstructured":"Tibshirani R (1996) Regression shrinkage and selection via the lasso. J R Stat Soc Ser B 58:267\u2013288","journal-title":"J R Stat Soc Ser B"},{"key":"970_CR105","unstructured":"Tibshirani R (2019) Lecture notes in statistical learning. http:\/\/statweb.stanford.edu\/~tibs\/stat315a\/glossary.pdf. Accessed 8 Oct 2019"},{"key":"970_CR106","doi-asserted-by":"crossref","first-page":"443","DOI":"10.1162\/089976699300016728","volume":"11","author":"ME Tipping","year":"1999","unstructured":"Tipping ME, Bishop CM (1999) Mixtures of probabilistic principal component analyzers. Neural Comput 11:443\u2013482","journal-title":"Neural Comput"},{"key":"970_CR107","volume-title":"Handbook of research on machine learning applications and trends: algorithms, methods, and techniques","author":"L Torrey","year":"2009","unstructured":"Torrey L, Shavlik J (2009) Transfer learning. In: Soria E, Martin J, Magdalena R, Martinez M, Serrano A (eds) Handbook of research on machine learning applications and trends: algorithms, methods, and techniques, vol 242. IGI Global, Pennsylvania"},{"key":"970_CR108","doi-asserted-by":"crossref","first-page":"2719","DOI":"10.1162\/089976600300014908","volume":"12","author":"V Tresp","year":"2000","unstructured":"Tresp V (2000) A Bayesian committee machine. Neural Comput 12:2719\u20132741","journal-title":"Neural Comput"},{"key":"970_CR109","unstructured":"UC Berkeley (2018) Statistical machine learning, Univ of California at Berkeley. https:\/\/www.stat.berkeley.edu\/~statlearning\/. Accessed 8 Oct 2019"},{"key":"970_CR110","doi-asserted-by":"crossref","first-page":"907","DOI":"10.1214\/aos\/1176347632","volume":"18","author":"S Van de Geer","year":"1990","unstructured":"Van de Geer S (1990) Estimating a regression function. Ann Stat 18:907\u2013924","journal-title":"Ann Stat"},{"key":"970_CR111","volume-title":"Statistical learning theory","author":"V Vapnik","year":"1998","unstructured":"Vapnik V (1998) Statistical learning theory. Wiley, New York"},{"key":"970_CR112","volume-title":"Reinforcement Learning. Adaptation, Learning, and Optimization","author":"N Vlassis","year":"2012","unstructured":"Vlassis N, Ghavamzadeh M, Mannor S, Poupart P (2012) Bayesian reinforcement learning. In: Wiering M, van Otterlo M (eds) Reinforcement Learning. Adaptation, Learning, and Optimization, vol 12. Springer, Berlin"},{"key":"970_CR113","series-title":"Springer Texts in Statistics","doi-asserted-by":"crossref","DOI":"10.1007\/978-0-387-21736-9","volume-title":"All of statistics: a concise course in statistical inference","author":"L Wasserman","year":"2004","unstructured":"Wasserman L (2004) All of statistics: a concise course in statistical inference. Springer Texts in Statistics. Springer, New York"},{"key":"970_CR114","unstructured":"Williams C (2015) AI guru Ng: fearing a rise of killer robots is like worrying about overpopulation on Mars. https:\/\/www.theregister.co.uk\/2015\/03\/19\/andrew_ng_baidu_ai\/. Accessed 8 Oct 2019"},{"key":"970_CR115","doi-asserted-by":"crossref","first-page":"241","DOI":"10.1016\/S0893-6080(05)80023-1","volume":"5","author":"DH Wolpert","year":"1992","unstructured":"Wolpert DH (1992) Stacked generalization. Neural Netw 5:241\u2013259","journal-title":"Neural Netw"},{"key":"970_CR116","doi-asserted-by":"crossref","first-page":"1341","DOI":"10.1162\/neco.1996.8.7.1341","volume":"8","author":"DH Wolpert","year":"1996","unstructured":"Wolpert DH (1996) The lack of a priori distinctions between learning algorithms. Neural Comput 8:1341\u20131390","journal-title":"Neural Comput"},{"key":"970_CR117","doi-asserted-by":"crossref","first-page":"67","DOI":"10.1109\/4235.585893","volume":"1","author":"DH Wolpert","year":"1997","unstructured":"Wolpert DH, Macready WG (1997) No free lunch theorems for optimization. IEEE Trans Evol Comput 1:67\u201382","journal-title":"IEEE Trans Evol Comput"},{"key":"970_CR118","doi-asserted-by":"crossref","first-page":"97","DOI":"10.1109\/TKDE.2013.109","volume":"26","author":"X Wu","year":"2014","unstructured":"Wu X, Zhu X, Wu G-Q, Ding W (2014) Data mining with big data. IEEE Trans Knowl Data Eng 26:97\u2013107","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"970_CR119","doi-asserted-by":"crossref","first-page":"304","DOI":"10.1109\/TKDE.2006.46","volume":"18","author":"H Xiong","year":"2006","unstructured":"Xiong H, Pandey G, Steinbach M, Kumar V (2006) Enhancing data analysis with noise removal. IEEE Trans Knowl Data Eng 18:304\u2013319","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"970_CR120","first-page":"652","volume":"43","author":"Y Yang","year":"2015","unstructured":"Yang Y, Tokdar ST et al (2015) Minimax-optimal nonparametric regression in high dimensions. Ann Stat 43:652\u2013674","journal-title":"Ann Stat"},{"key":"970_CR121","unstructured":"Yosinski J, Clune J, Bengio Y, Lipson H (2014) How transferable are features in deep neural networks? In: Proceedings of the 27th international conference on neural information processing systems, pp 3320\u20133328"},{"key":"970_CR122","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1145\/2934664","volume":"59","author":"M Zaharia","year":"2016","unstructured":"Zaharia M, Xin RS, Wendell P, Das T, Armbrust M, Dave A, Meng X, Rosen J, Venkataraman S, Franklin MJ et al (2016) Apache spark: a unified engine for big data processing. Commun ACM 59:56\u201365","journal-title":"Commun ACM"},{"key":"970_CR123","doi-asserted-by":"crossref","unstructured":"Zhang T (2004) Solving large scale linear prediction problems using stochastic gradient descent algorithms. In: Proceedings of the twenty-first international conference on Machine learning, vol 116. ACM","DOI":"10.1145\/1015330.1015332"},{"key":"970_CR124","unstructured":"Zhiyuan Chen C, Hruschka E, Liu B (2016) KDD 2016 Tutorials - YouTube. http:\/\/www.youtube.com\/playlist?list=PLvM6T5w9YQBL6rP1-vGqhAa-SQ84KVv0c. Accessed 8 Oct 2019"},{"key":"970_CR125","doi-asserted-by":"crossref","first-page":"627","DOI":"10.1093\/nsr\/nwx044","volume":"4","author":"J Zhu","year":"2017","unstructured":"Zhu J, Chen J, Hu W, Zhang B (2017) Big learning with Bayesian methods. Natl Sci Rev 4:627\u2013651","journal-title":"Natl Sci Rev"},{"key":"970_CR126","doi-asserted-by":"crossref","first-page":"301","DOI":"10.1111\/j.1467-9868.2005.00503.x","volume":"67","author":"H Zou","year":"2005","unstructured":"Zou H, Hastie T (2005) Regularization and variable selection via the elastic net. J R Stat Soc Ser B 67:301\u2013320","journal-title":"J R Stat Soc Ser B"}],"container-title":["Computational Statistics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00180-020-00970-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00180-020-00970-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00180-020-00970-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,3]],"date-time":"2024-08-03T06:29:10Z","timestamp":1722666550000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00180-020-00970-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,4,1]]},"references-count":126,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2020,9]]}},"alternative-id":["970"],"URL":"https:\/\/doi.org\/10.1007\/s00180-020-00970-8","relation":{},"ISSN":["0943-4062","1613-9658"],"issn-type":[{"value":"0943-4062","type":"print"},{"value":"1613-9658","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,4,1]]},"assertion":[{"value":"17 December 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 February 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 April 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}