{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T08:13:13Z","timestamp":1759133593765},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"15","license":[{"start":{"date-parts":[[2016,2,23]],"date-time":"2016-02-23T00:00:00Z","timestamp":1456185600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2016,8]]},"DOI":"10.1007\/s11042-016-3294-5","type":"journal-article","created":{"date-parts":[[2016,2,23]],"date-time":"2016-02-23T08:26:44Z","timestamp":1456216004000},"page":"9169-9184","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Multiple kernel visual-auditory representation learning for retrieval"],"prefix":"10.1007","volume":"75","author":[{"given":"Hong","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wenping","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wenhe","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xin","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hehe","family":"Fan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2016,2,23]]},"reference":[{"key":"3294_CR1","unstructured":"Chang X, Yang Y, Hauptmann AG, Xing E, Yu Y (2015) Semantic concept discovery for large-scale zero-shot event detection. International Joint Conference on Artificial Intelligence, IJCAI"},{"key":"3294_CR2","unstructured":"Chang X, Yang Y, Xing E, Yu Y (2015) Complex event detection using semantic saliency and nearly-isotonic SVM. International Conference on Machine Learning (ICML)"},{"key":"3294_CR3","doi-asserted-by":"crossref","unstructured":"Chang X, Yu Y, Yang Y, Hauptmann A (2015) Searching persuasively: joint event detection and evidence justification with limited supervision. ACM MM","DOI":"10.1145\/2733373.2806218"},{"key":"3294_CR4","doi-asserted-by":"crossref","first-page":"47","DOI":"10.1016\/S0024-3795(99)00085-3","volume":"321","author":"DD Gao","year":"2000","unstructured":"Gao DD, Huang RB (2000) Some results on canonical correlation and their application to a linear model. Linear Algebra Appl 321:47\u201359","journal-title":"Linear Algebra Appl"},{"key":"3294_CR5","first-page":"2211","volume":"12","author":"M Gonen","year":"2011","unstructured":"Gonen M, Alpayd\u0131n E (2011) Multiple kernel learning algorithms. J Mach Learn Res 12:2211\u20132268","journal-title":"J Mach Learn Res"},{"key":"3294_CR6","first-page":"519","volume":"13","author":"P Jain","year":"2012","unstructured":"Jain P, Kulis B, Davis JV, Dhillon IS (2012) Metric and kernel learning using a linear transformation. J Mach Learn Res 13:519\u2013547","journal-title":"J Mach Learn Res"},{"key":"3294_CR7","doi-asserted-by":"crossref","unstructured":"Jain A, Vishwanathan SVN, Varma M (2012) Spg-gmkl: generalized multiple kernel learning with a million kernels. In: Proceedings of the ACM SIGKDD conference on knowledge discovery and data mining","DOI":"10.1145\/2339530.2339648"},{"key":"3294_CR8","first-page":"27","volume":"5","author":"GRG Lanckriet","year":"2004","unstructured":"Lanckriet GRG, Cristianini N, Bartlett P, Ghaoui LE, Jordan MI (2004) Learning the kernel matrix with semi-definite programming. J Mach Learn Res 5:27\u201372","journal-title":"J Mach Learn Res"},{"issue":"1","key":"3294_CR9","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/1126004.1126005","volume":"2","author":"MS Lew","year":"2006","unstructured":"Lew MS, Sebe N, Djeraba C, Jain R (2006) Content-based multimedia information retrieval: state of the art and challenges. ACM Trans Multimed Comput Commun Appl 2(1):1\u201319","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"key":"3294_CR10","doi-asserted-by":"crossref","unstructured":"Liu Y, Wu F, Zhuang Y, Xiao J (2008) Active post-refined multimodality video semantic concept detection with tensor representation. ACM International Conference on Multimedia. pp.91\u2013100","DOI":"10.1145\/1459359.1459372"},{"key":"3294_CR11","doi-asserted-by":"crossref","unstructured":"Liu G, Yan Y, Gao C, Tong W, Hauptmann AG, Sebe N (2014) The mystery of faces: investigating face contribution for multimedia event detection. ICMR","DOI":"10.1145\/2578726.2578795"},{"issue":"4","key":"3294_CR12","doi-asserted-by":"crossref","first-page":"491","DOI":"10.1109\/TKDE.2005.66","volume":"17","author":"H Liu","year":"2005","unstructured":"Liu H, Yu L (2005) Toward integrating feature selection algorithms for classication and clustering. IEEE Trans Knowl Data Eng 17(4):491\u2013502","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"7","key":"3294_CR13","doi-asserted-by":"crossref","first-page":"659","DOI":"10.1016\/j.is.2005.12.004","volume":"31","author":"Q Ma","year":"2006","unstructured":"Ma Q, Akiyo N, Katsumi T (2006) Complementary information retrieval for cross-media news content. Inf Syst 31(7):659\u2013678","journal-title":"Inf Syst"},{"key":"3294_CR14","doi-asserted-by":"crossref","first-page":"1961","DOI":"10.1016\/S0031-3203(03)00058-X","volume":"36","author":"T Melzer","year":"2003","unstructured":"Melzer T, Reiter M, Bischof H (2003) Appearance models based on kernel canonical correlation analysis. Pattern Recogn 36:1961\u20131971","journal-title":"Pattern Recogn"},{"issue":"2","key":"3294_CR15","doi-asserted-by":"crossref","first-page":"523","DOI":"10.1007\/s11042-014-1936-z","volume":"74","author":"H Shen","year":"2015","unstructured":"Shen H, Yan Y, Xu S, Ballas N, Chen W (2015) Evaluation of semi-supervised learning method on action recognition. Multimedia Tools and Applications 74(2):523\u2013542","journal-title":"Multimedia Tools and Applications"},{"key":"3294_CR16","first-page":"1531","volume":"7","author":"S Sonnenburg","year":"2006","unstructured":"Sonnenburg S, R\u00e4tsch G, Schafer C, Scholkopf B (2006) Largescale multiple kernel learning. J Mach Learn Res 7:1531\u20131565","journal-title":"J Mach Learn Res"},{"key":"3294_CR17","doi-asserted-by":"crossref","first-page":"531","DOI":"10.1016\/j.imavis.2006.04.014","volume":"25","author":"T Sun","year":"2007","unstructured":"Sun T, Chen S (2007) Locality preserving CCA with applications to data visualization and pose estimation. Image Vis Comput 25:531\u2013543","journal-title":"Image Vis Comput"},{"issue":"2","key":"3294_CR18","first-page":"1","volume":"27","author":"M Thomas","year":"2003","unstructured":"Thomas M, Michael R, Horst B (2003) Appearance models based on kernel canonical correlation analysis. Pattern Recogn 27(2):1\u20138","journal-title":"Pattern Recogn"},{"key":"3294_CR19","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1016\/j.cviu.2015.06.007","volume":"140","author":"G Tolias","year":"2015","unstructured":"Tolias G, Bursuc A, Furon T, J\u00e9gou H (2015) Rotation and translation covariant match kernels for image retrieval. Comp Vis Image Underst 140:9\u201320","journal-title":"Comp Vis Image Underst"},{"key":"3294_CR20","doi-asserted-by":"crossref","unstructured":"Tong S, Chang E (2001) Support vector machine active learning for image retrieval. ACM International Conference on Multimedia, pp. 107\u2013118","DOI":"10.1145\/500141.500159"},{"key":"3294_CR21","doi-asserted-by":"crossref","unstructured":"Vapnik V (1997) The nature of statistical learning theory. IEEE Trans Neural Netw 8(6)","DOI":"10.1109\/TNN.1997.641482"},{"key":"3294_CR22","doi-asserted-by":"crossref","unstructured":"Varma M, Babu BR (2009) More generality in efficient multiple kernel learning. In Proceedings of International Conference on Machine Learning, pp.1065\u20131072","DOI":"10.1145\/1553374.1553510"},{"key":"3294_CR23","unstructured":"Vishwanathan SVN, Sun Z, Ampornpunt N, Varma M (2010) Multiple kernel learning and the SMO algorithm. In: NIPS, pp. 2361\u20132369"},{"issue":"3","key":"3294_CR24","doi-asserted-by":"crossref","first-page":"550","DOI":"10.1109\/TPAMI.2013.145","volume":"36","author":"D Wang","year":"2014","unstructured":"Wang D, Hoi SC, He Y, Zhu J, Mei T, Luo J (2014) Retrieval-based face annotation by weak label regularized local coordinate coding. IEEE Trans Pattern Ana Mach Intell (TPAMI) 36(3):550\u2013563","journal-title":"IEEE Trans Pattern Ana Mach Intell (TPAMI)"},{"key":"3294_CR25","unstructured":"Wu Y, Chang EY, Chang CC, Kevin, Smith JR (2004) Optimal multimodal fusion for multi-media data analysis. In: ACM Multimedia Conference, pp. 572\u2013579"},{"key":"3294_CR26","doi-asserted-by":"crossref","unstructured":"Wu Y, Chang EY, Chen-Chuan Chang K, Smith JR (2004) Optimal multimodal fusion for multimedia data analysis. ACM International Conference on Multimedia, pp.572\u2013579","DOI":"10.1145\/1027527.1027665"},{"key":"3294_CR27","unstructured":"Xia H, Hoi SC, Jin R, Zhao P (2012) Online multiple kernel similarity learning for visual search. IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI) 1(1)"},{"issue":"10","key":"3294_CR28","doi-asserted-by":"crossref","first-page":"2984","DOI":"10.1109\/TIP.2015.2438540","volume":"24","author":"Y Yan","year":"2015","unstructured":"Yan Y, Ricci E, Liu G, Sebe N (2015) Egocentric daily activity recognition via multitask clustering. IEEE Trans Image Process 24(10):2984\u20132995","journal-title":"IEEE Trans Image Process"},{"key":"3294_CR29","doi-asserted-by":"crossref","unstructured":"Yan Y, Ricci E, Subramanian R, Liu G, Lanz O, Sebe N. A multi-task learning framework for head pose estimation under target motion, IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI), in press","DOI":"10.1109\/TPAMI.2015.2477843"},{"issue":"7","key":"3294_CR30","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1016\/j.cviu.2014.02.006","volume":"124","author":"Y Yan","year":"2014","unstructured":"Yan Y, Shen H, Liu G, Ma Z, Gao C, Sebe N (2014) GLocal tells you more: coupling glocal structural for feature selection with sparsity for image and video classification. Comp Vision Image Underst (CVIU) 124(7):99\u2013109","journal-title":"Comp Vision Image Underst (CVIU)"},{"issue":"3","key":"3294_CR31","doi-asserted-by":"crossref","first-page":"661","DOI":"10.1109\/TMM.2012.2237023","volume":"15","author":"Y Yang","year":"2012","unstructured":"Yang Y, Ma Z, Hauptmann AG, Sebe N (2012) Feature selection for multimedia analysis by sharing information among multiple tasks. IEEE Trans Multimed 15(3):661\u2013669","journal-title":"IEEE Trans Multimed"},{"issue":"5","key":"3294_CR32","doi-asserted-by":"crossref","first-page":"723","DOI":"10.1109\/TPAMI.2011.170","volume":"34","author":"Y Yang","year":"2012","unstructured":"Yang Y, Nie F, Xu D, Luo J, Zhuang Y, Pan Y (2012) A multimedia retrieval framework based on semi-supervised ranking and relevance feedback. IEEE Trans Pattern Anal Mach Intell (TPAMI) 34(5):723\u2013742","journal-title":"IEEE Trans Pattern Anal Mach Intell (TPAMI)"},{"issue":"3","key":"3294_CR33","doi-asserted-by":"crossref","first-page":"572","DOI":"10.1109\/TMM.2012.2234731","volume":"15","author":"Y Yang","year":"2013","unstructured":"Yang Y, Song J, Huang Z, Ma Z, Sebe N, Hauptmann AG (2013) Multi-feature fusion via hierarchical regression for multimedia analysis. IEEE Trans Multimedia 15(3):572\u201358","journal-title":"IEEE Trans Multimedia"},{"issue":"3","key":"3294_CR34","doi-asserted-by":"crossref","first-page":"437","DOI":"10.1109\/TMM.2008.917359","volume":"10","author":"Y Yang","year":"2008","unstructured":"Yang Y, Zhuang Y, Wu F, Pan Y (2008) Harmonizing hierarchical manifolds for multimedia document semantics understanding and cross-media retrieval. IEEE Transactions on Multimedia 10(3):437\u2013446","journal-title":"IEEE Transactions on Multimedia"},{"key":"3294_CR35","doi-asserted-by":"crossref","unstructured":"Yu Z, Wu F, Yang Y, Tian Q, Luo J, Zhuang Y (2014) Discriminative coupled dictionary hashing for fast cross-media retrieval. SIGIR, 395\u2013404","DOI":"10.1145\/2600428.2609563"},{"key":"3294_CR36","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1016\/j.neucom.2012.03.033","volume":"119","author":"H Zhang","year":"2013","unstructured":"Zhang H, Liu Y, Ma Z (2013) Fusing inherent and external knowledge with nonlinear learning for cross-media retrieval. Neurocomputing 119:10\u201316","journal-title":"Neurocomputing"},{"key":"3294_CR37","doi-asserted-by":"crossref","first-page":"93","DOI":"10.1016\/j.neucom.2015.07.104","volume":"173","author":"H Zhang","year":"2016","unstructured":"Zhang H, Wu P, Beck A, Zhang Z, Gao X (2016) Adaptive incremental learning of image semantics with application to social robot. Neurocomputing 173:93\u2013101","journal-title":"Neurocomputing"},{"key":"3294_CR38","doi-asserted-by":"crossref","first-page":"100","DOI":"10.1016\/j.neucom.2012.03.007","volume":"93","author":"H Zhang","year":"2012","unstructured":"Zhang H, Yu J, Wang M, Liu Y (2012) Semi-supervised distance metric learning based on local linear regression for data clustering. Neurocomputing 93:100\u2013105","journal-title":"Neurocomputing"},{"key":"3294_CR39","doi-asserted-by":"crossref","unstructured":"Zhang H, Yuan J, Gao X, Chen Z (2014) Boosting cross-media retrieval via visual-auditory feature analysis and relevance feedback. ACM International Conference on Multimedia","DOI":"10.1145\/2647868.2654975"},{"issue":"2","key":"3294_CR40","doi-asserted-by":"crossref","first-page":"221","DOI":"10.1109\/TMM.2007.911822","volume":"10","author":"Y Zhuang","year":"2008","unstructured":"Zhuang Y, Yang Y, Wu F (2008) Mining semantic correlation of heterogeneous multimedia data for cross-media retrieval. IEEE Transactions on Multimedia 10(2):221\u2013229","journal-title":"IEEE Transactions on Multimedia"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-016-3294-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11042-016-3294-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-016-3294-5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,4]],"date-time":"2019-09-04T22:05:40Z","timestamp":1567634740000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11042-016-3294-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,2,23]]},"references-count":40,"journal-issue":{"issue":"15","published-print":{"date-parts":[[2016,8]]}},"alternative-id":["3294"],"URL":"https:\/\/doi.org\/10.1007\/s11042-016-3294-5","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,2,23]]}}}