{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,10]],"date-time":"2026-05-10T10:20:21Z","timestamp":1778408421779,"version":"3.51.4"},"publisher-location":"Cham","reference-count":42,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319306704","type":"print"},{"value":"9783319306711","type":"electronic"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-30671-1_4","type":"book-chapter","created":{"date-parts":[[2016,3,9]],"date-time":"2016-03-09T16:39:50Z","timestamp":1457541590000},"page":"45-57","source":"Crossref","is-referenced-by-count":325,"title":["Deep Learning over Multi-field Categorical Data"],"prefix":"10.1007","author":[{"given":"Weinan","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tianming","family":"Du","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jun","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"4_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"584","DOI":"10.1007\/3-540-45108-0_62","volume-title":"Intelligent Tutoring Systems","author":"JE Beck","year":"2000","unstructured":"Beck, J.E., Park Woolf, B.: High-level student modeling with machine learning. In: Gauthier, G., VanLehn, K., Frasson, C. (eds.) ITS 2000. LNCS, vol. 1839, pp. 584\u2013593. Springer, Heidelberg (2000)"},{"issue":"1","key":"4_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1561\/2200000006","volume":"2","author":"Y Bengio","year":"2009","unstructured":"Bengio, Y.: Learning deep architectures for AI. Found. Trends Mach. Learn. 2(1), 1\u2013127 (2009)","journal-title":"Found. Trends Mach. Learn."},{"key":"4_CR3","doi-asserted-by":"crossref","unstructured":"Bengio, Y., Lamblin, P., Popovici, D., Larochelle, H., et al.: Greedy layer-wise training of deep networks. In: NIPS, vol. 19, p. 153 (2007)","DOI":"10.7551\/mitpress\/7503.003.0024"},{"key":"4_CR4","unstructured":"Bengio, Y., Yao, L., Alain, G., Vincent, P.: Generalized denoising auto-encoders as generative models. In: NIPS, pp. 899\u2013907 (2013)"},{"issue":"2","key":"4_CR5","first-page":"123","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman, L.: Bagging predictors. Mach. Learn. 24(2), 123\u2013140 (1996)","journal-title":"Mach. Learn."},{"key":"4_CR6","unstructured":"Broder, A.Z.: Computational advertising. In: SODA, vol. 8, pp. 992\u2013992 (2008)"},{"key":"4_CR7","first-page":"2493","volume":"12","author":"R Collobert","year":"2011","unstructured":"Collobert, R., Weston, J., Bottou, L., Karlen, M., Kavukcuoglu, K., Kuksa, P.: Natural language processing (almost) from scratch. JMLR 12, 2493\u20132537 (2011)","journal-title":"JMLR"},{"key":"4_CR8","doi-asserted-by":"crossref","unstructured":"Deng, L., Abdel-Hamid, O., Yu, D.: A deep convolutional neural network using heterogeneous pooling for trading acoustic invariance with phonetic confusion. In: ICASSP, pp. 6669\u20136673. IEEE (2013)","DOI":"10.1109\/ICASSP.2013.6638952"},{"issue":"05n06","key":"4_CR9","doi-asserted-by":"publisher","first-page":"535","DOI":"10.1142\/S0129065797000513","volume":"8","author":"D Elizondo","year":"1997","unstructured":"Elizondo, D., Fiesler, E.: A survey of partially connected neural networks. Int. J. Neural Syst. 8(05n06), 535\u2013558 (1997)","journal-title":"Int. J. Neural Syst."},{"key":"4_CR10","first-page":"625","volume":"11","author":"D Erhan","year":"2010","unstructured":"Erhan, D., Bengio, Y., Courville, A., Manzagol, P.A., Vincent, P., Bengio, S.: Why does unsupervised pre-training help deep learning? JMLR 11, 625\u2013660 (2010)","journal-title":"JMLR"},{"issue":"4","key":"4_CR11","doi-asserted-by":"publisher","first-page":"193","DOI":"10.1007\/BF00344251","volume":"36","author":"K Fukushima","year":"1980","unstructured":"Fukushima, K.: Neocognitron: a self-organizing neural network model for a mechanism of pattern recognition unaffected by shift in position. Biol. Cybern. 36(4), 193\u2013202 (1980)","journal-title":"Biol. Cybern."},{"key":"4_CR12","unstructured":"Graepel, T., Candela, J.Q., Borchert, T., Herbrich, R.: Web-scale bayesian click-through rate prediction for sponsored search advertising in microsoft\u2019s bing search engine. In: ICML, pp. 13\u201320 (2010)"},{"key":"4_CR13","doi-asserted-by":"crossref","unstructured":"Graves, A., Mohamed, A., Hinton, G.: Speech recognition with deep recurrent neural networks. In: ICASSP, pp. 6645\u20136649. IEEE (2013)","DOI":"10.1109\/ICASSP.2013.6638947"},{"issue":"3","key":"4_CR14","first-page":"385","volume":"69","author":"DJ Hand","year":"2001","unstructured":"Hand, D.J., Yu, K.: Idiot\u2019s bayes not so stupid after all? Int. Statist. Rev. 69(3), 385\u2013398 (2001)","journal-title":"Int. Statist. Rev."},{"key":"4_CR15","doi-asserted-by":"crossref","unstructured":"He, X., Pan, J., Jin, O., Xu, T., Liu, B., Xu, T., Shi, Y., Atallah, A., Herbrich, R., Bowers, S., et al.: Practical lessons from predicting clicks on ads at facebook. In: ADKDD, pp. 1\u20139. ACM (2014)","DOI":"10.1145\/2648584.2648589"},{"issue":"1","key":"4_CR16","first-page":"926","volume":"9","author":"G Hinton","year":"2010","unstructured":"Hinton, G.: A practical guide to training restricted boltzmann machines. Momentum 9(1), 926 (2010)","journal-title":"Momentum"},{"issue":"8","key":"4_CR17","doi-asserted-by":"publisher","first-page":"1771","DOI":"10.1162\/089976602760128018","volume":"14","author":"GE Hinton","year":"2002","unstructured":"Hinton, G.E.: Training products of experts by minimizing contrastive divergence. Neural comput. 14(8), 1771\u20131800 (2002)","journal-title":"Neural comput."},{"issue":"5786","key":"4_CR18","doi-asserted-by":"publisher","first-page":"504","DOI":"10.1126\/science.1127647","volume":"313","author":"GE Hinton","year":"2006","unstructured":"Hinton, G.E., Salakhutdinov, R.R.: Reducing the dimensionality of data with neural networks. Science 313(5786), 504\u2013507 (2006)","journal-title":"Science"},{"key":"4_CR19","doi-asserted-by":"crossref","unstructured":"Huang, P.S., He, X., Gao, J., Deng, L., Acero, A., Heck, L.: Learning deep structured semantic models for web search using clickthrough data. In: CIKM, pp. 2333\u20132338 (2013)","DOI":"10.1145\/2505515.2505665"},{"key":"4_CR20","unstructured":"Juan, Y.C., Zhuang, Y., Chin, W.S.: 3 idiots approach for display advertising challenge. In: Internet and Network Economics, pp. 254\u2013265. Springer, Heidelberg (2011)"},{"issue":"3","key":"4_CR21","doi-asserted-by":"publisher","first-page":"226","DOI":"10.1109\/34.667881","volume":"20","author":"J Kittler","year":"1998","unstructured":"Kittler, J., Hatef, M., Duin, R.P., Matas, J.: On combining classifiers. PAMI 20(3), 226\u2013239 (1998)","journal-title":"PAMI"},{"key":"4_CR22","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. In: NIPS (2012)"},{"key":"4_CR23","doi-asserted-by":"crossref","unstructured":"Kurashima, T., Iwata, T., Takaya, N., Sawada, H.: Probabilistic latent network visualization: inferring and embedding diffusion networks. In: KDD, pp. 1236\u20131245. ACM (2014)","DOI":"10.1145\/2623330.2623646"},{"key":"4_CR24","first-page":"1","volume":"10","author":"H Larochelle","year":"2009","unstructured":"Larochelle, H., Bengio, Y., Louradour, J., Lamblin, P.: Exploring strategies for training deep neural networks. JMLR 10, 1\u201340 (2009)","journal-title":"JMLR"},{"issue":"7553","key":"4_CR25","doi-asserted-by":"crossref","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Yann LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521(7553) (2015)","journal-title":"Nature"},{"key":"4_CR26","doi-asserted-by":"crossref","unstructured":"Lee, K., Orten, B., Dasdan, A., Li, W.: Estimating conversion rate in display advertising from past performance data. In: KDD, pp. 768\u2013776. ACM (2012)","DOI":"10.1145\/2339530.2339651"},{"key":"4_CR27","doi-asserted-by":"crossref","unstructured":"Liao, H., Peng, L., Liu, Z., Shen, X.: ipinyou global rtb bidding algorithm competition dataset. In: ADKDD, pp. 1\u20136. ACM (2014)","DOI":"10.1145\/2648584.2648590"},{"key":"4_CR28","doi-asserted-by":"crossref","unstructured":"McMahan, H.B., Holt, G., Sculley, D., Young, M., Ebner, D., Grady, J., Nie, L., Phillips, T., Davydov, E., Golovin, D., et al.: Ad click prediction: a view from the trenches. In: KDD, pp. 1222\u20131230. ACM (2013)","DOI":"10.1145\/2487575.2488200"},{"key":"4_CR29","doi-asserted-by":"crossref","unstructured":"Oentaryo, R.J., Lim, E.P., Low, D.J.W., Lo, D., Finegold, M.: Predicting response in mobile advertising with hierarchical importance-aware factorization machine. In: WSDM (2014)","DOI":"10.1145\/2556195.2556240"},{"issue":"4","key":"4_CR30","doi-asserted-by":"publisher","first-page":"761","DOI":"10.1016\/S0893-6080(98)00010-0","volume":"11","author":"L Prechelt","year":"1998","unstructured":"Prechelt, L.: Automatic early stopping using cross validation: quantifying the criteria. Neural Netw. 11(4), 761\u2013767 (1998)","journal-title":"Neural Netw."},{"issue":"3","key":"4_CR31","first-page":"57","volume":"3","author":"S Rendle","year":"2012","unstructured":"Rendle, S.: Factorization machines with libfm. ACM TIST 3(3), 57 (2012)","journal-title":"ACM TIST"},{"key":"4_CR32","doi-asserted-by":"crossref","unstructured":"Richardson, M., Dominowska, E., Ragno, R.: Predicting clicks: estimating the click-through rate for new ads. In: WWW, pp. 521\u2013530. ACM (2007)","DOI":"10.1145\/1242572.1242643"},{"key":"4_CR33","doi-asserted-by":"crossref","unstructured":"Shen, Y., He, X., Gao, J., Deng, L., Mesnil, G.: A latent semantic model with convolutional-pooling structure for information retrieval. In: CIKM (2014)","DOI":"10.1145\/2661829.2661935"},{"key":"4_CR34","unstructured":"Snoek, J., Larochelle, H., Adams, R.P.: Practical bayesian optimization of machine learning algorithms. In: NIPS, pp. 2951\u20132959 (2012)"},{"issue":"1","key":"4_CR35","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava, N., Hinton, G., Krizhevsky, A., Sutskever, I., Salakhutdinov, R.: Dropout: A simple way to prevent neural networks from overfitting. JMLR 15(1), 1929\u20131958 (2014)","journal-title":"JMLR"},{"key":"4_CR36","unstructured":"Sutskever, I., Martens, J., Dahl, G., Hinton, G.: On the importance of initialization and momentum in deep learning. In: ICML, pp. 1139\u20131147 (2013)"},{"key":"4_CR37","doi-asserted-by":"crossref","unstructured":"Tang, J., Qu, M., Wang, M., Zhang, M., Yan, J., Mei, Q.: Line: Large-scale information network embedding. In: WWW, pp. 1067\u20131077 (2015)","DOI":"10.1145\/2736277.2741093"},{"key":"4_CR38","doi-asserted-by":"crossref","unstructured":"Trofimov, I., Kornetova, A., Topinskiy, V.: Using boosted trees for click-through rate prediction for sponsored search. In: WINE, p. 2. ACM (2012)","DOI":"10.1145\/2351356.2351358"},{"key":"4_CR39","first-page":"1","volume-title":"Advances in Multimedia and Interactive Technologies","author":"Xuerui Wang","year":"2011","unstructured":"Wang, X., Li, W., Cui, Y., Zhang, R., Mao, J.: Click-through rate estimation for rare events in online advertising. In: Online Multimedia Advertising: Techniques and Technologies, pp. 1\u201312 (2010)"},{"key":"4_CR40","doi-asserted-by":"crossref","unstructured":"Zeiler, M.D., Taylor, G.W., Fergus, R.: Adaptive deconvolutional networks for mid and high level feature learning. In: ICCV, pp. 2018\u20132025. IEEE (2011)","DOI":"10.1109\/ICCV.2011.6126474"},{"key":"4_CR41","doi-asserted-by":"crossref","unstructured":"Zhang, W., Yuan, S., Wang, J.: Optimal real-time bidding for display advertising. In: KDD, pp. 1077\u20131086. ACM (2014)","DOI":"10.1145\/2623330.2623633"},{"issue":"13","key":"4_CR42","first-page":"1772","volume":"7","author":"Y Zou","year":"2014","unstructured":"Zou, Y., Jin, X., Li, Y., Guo, Z., Wang, E., Xiao, B.: Mariana: Tencent deep learning platform and its applications. VLDB 7(13), 1772\u20131777 (2014)","journal-title":"VLDB"}],"container-title":["Lecture Notes in Computer Science","Advances in Information Retrieval"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-30671-1_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,17]],"date-time":"2023-08-17T05:17:20Z","timestamp":1692249440000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-30671-1_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319306704","9783319306711"],"references-count":42,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-30671-1_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016]]}}}