{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,18]],"date-time":"2025-11-18T12:07:28Z","timestamp":1763467648129},"reference-count":11,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1109\/icassp.2004.1326727","type":"proceedings-article","created":{"date-parts":[[2004,9,28]],"date-time":"2004-09-28T09:50:22Z","timestamp":1096365022000},"page":"iii-1044-7","source":"Crossref","is-referenced-by-count":36,"title":["Statistical models for automatic video annotation and retrieval"],"prefix":"10.1109","volume":"3","author":[{"given":"V.","family":"Lavrenko","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"S.L.","family":"Feng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"R.","family":"Manmatha","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2004.1315274"},{"key":"2","first-page":"97","article-title":"Object recognition as machine translation: Learning a lexicon for a fixed image vocabulary","author":"duygulu","year":"2002","journal-title":"Seventh European Conf on Computer Vision"},{"year":"0","key":"10"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1145\/860458.860460"},{"key":"7","article-title":"Associating video frames with text","author":"duygulu","year":"2003","journal-title":"Proceedings of the SIGIR Multimedia Information Retrieval Workshop 2003"},{"key":"6","article-title":"A model for learning the semantics of pictures","author":"lavrenko","year":"0","journal-title":"Proceedings of NIPS'03"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1145\/290941.291008"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1145\/860458.860459"},{"key":"9","article-title":"The TREC-2002 video track report","author":"smeaton","year":"0","journal-title":"The Eleventh Text REtrieval Conf (TREC-2002)"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2000.855895"},{"key":"11","article-title":"Experimental evaluation of a generative probabilistic image retrieval model on 'easy' data","author":"westerveld","year":"2003","journal-title":"Proceedings of the SIGIR Multimedia Information Retrieval Workshop 2003"}],"event":{"name":"2004 IEEE International Conference on Acoustics, Speech, and Signal Processing","acronym":"ICASSP-04","location":"Montreal, Que., Canada"},"container-title":["2004 IEEE International Conference on Acoustics, Speech, and Signal Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/9248\/29345\/01326727.pdf?arnumber=1326727","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,13]],"date-time":"2017-03-13T22:12:56Z","timestamp":1489443176000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/1326727\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"references-count":11,"URL":"https:\/\/doi.org\/10.1109\/icassp.2004.1326727","relation":{},"subject":[]}}