{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,29]],"date-time":"2026-05-29T18:37:21Z","timestamp":1780079841527,"version":"3.54.0"},"reference-count":65,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100000732","name":"U.K.-India Education and Research Initiatives-Department of Science and Technology (UKIERI-DST), Government of India","doi-asserted-by":"publisher","award":["DSTKIERI-2018-19-10"],"award-info":[{"award-number":["DSTKIERI-2018-19-10"]}],"id":[{"id":"10.13039\/501100000732","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100010009","name":"Research Investment Fund at Edge Hill University","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100010009","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Image Process."],"published-print":{"date-parts":[[2021]]},"DOI":"10.1109\/tip.2021.3064256","type":"journal-article","created":{"date-parts":[[2021,3,11]],"date-time":"2021-03-11T21:07:13Z","timestamp":1615496833000},"page":"3691-3704","source":"Crossref","is-referenced-by-count":50,"title":["Attend and Guide (AG-Net): A Keypoints-Driven Attention-Based Deep Network for Image Recognition"],"prefix":"10.1109","volume":"30","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4546-076X","authenticated-orcid":false,"given":"Asish","family":"Bera","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5983-6468","authenticated-orcid":false,"given":"Zachary","family":"Wharton","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3774-2134","authenticated-orcid":false,"given":"Yonghuai","family":"Liu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6013-3935","authenticated-orcid":false,"given":"Nik","family":"Bessis","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0276-9000","authenticated-orcid":false,"given":"Ardhendu","family":"Behera","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TCSS.2017.2766884"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1049\/iet-its.2011.0116"},{"key":"ref33","article-title":"Caltech-256 object category dataset","author":"griffin","year":"2007"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/3329168"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10599-4_29"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.390"},{"key":"ref37","doi-asserted-by":"crossref","first-page":"1691","DOI":"10.1109\/TPAMI.2012.67","article-title":"Recognizing human-object interactions in still images by modeling the mutual context of objects and human poses","volume":"34","author":"yao","year":"2012","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2016.2605305"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00315"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2019.2934576"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2018.8546184"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-39601-9_4"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-15561-1_11"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-013-0636-x"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.image.2017.03.010"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2016.10.001"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5540234"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.74"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2016.03.002"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2014.04.018"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995368"},{"key":"ref20","first-page":"1","article-title":"Real-time distracted driver posture classification","volume":"abs 1706 9498","author":"abouelnaga","year":"2017","journal-title":"CoRR"},{"key":"ref22","first-page":"1","article-title":"Latent body-pose guided densenet for recognizing driver&#x2019;s fine-grained secondary activities","author":"behera","year":"2018","journal-title":"Proc IEEE Conf Adv Video Signal Based Surveill (AVSS"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1155\/2019\/4125865"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126386"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2018.00150"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3350916"},{"key":"ref25","first-page":"152","article-title":"Loss guided activation for action recognition in still images","author":"liu","year":"2018","journal-title":"Proc Asian Conf Comput Vis"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_38"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_26"},{"key":"ref56","author":"bishop","year":"2006","journal-title":"Pattern Recognition and Machine Learning"},{"key":"ref55","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref54","first-page":"2825","article-title":"Explicit inductive bias for transfer learning with convolutional networks","author":"xuhong","year":"2018","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref53","first-page":"818","article-title":"Visualizing and understanding convolutional networks","author":"zeiler","year":"2014","journal-title":"Proc Eur Conf Comput Vis"},{"key":"ref52","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"arXiv 1409 1556"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.284"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_25"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/s11760-019-01589-z"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2019.2929447"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000029664.99615.94"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/11744023_32"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248093"},{"key":"ref16","first-page":"58","article-title":"Action recognition via local descriptors and holistic features","author":"sun","year":"2009","journal-title":"Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit Workshops"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2017.10.013"},{"key":"ref18","article-title":"Self-attention generative adversarial networks","author":"zhang","year":"2018","journal-title":"arXiv 1805 08318"},{"key":"ref19","first-page":"5998","article-title":"Attention is all you need","author":"vaswani","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2017.2783944"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.367"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1504\/IJCVR.2020.104356"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00579"},{"key":"ref7","first-page":"1","article-title":"Neural machine translation by jointly learning to align and translate","author":"bahdanau","year":"2015","journal-title":"Proc 3rd Int Conf Learn Represent (ICLR)"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00907"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.129"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.325"},{"key":"ref45","first-page":"103","article-title":"Gpipe: Efficient training of giant neural networks using pipeline parallelism","author":"huang","year":"2019","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2016.03.004"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00432"},{"key":"ref41","article-title":"Fully convolutional attention networks for fine-grained recognition","author":"liu","year":"2016","journal-title":"arXiv 1603 06765"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2017.2758862"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2018.00068"}],"container-title":["IEEE Transactions on Image Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/83\/9263394\/09376653.pdf?arnumber=9376653","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T14:51:12Z","timestamp":1652194272000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9376653\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"references-count":65,"URL":"https:\/\/doi.org\/10.1109\/tip.2021.3064256","relation":{},"ISSN":["1057-7149","1941-0042"],"issn-type":[{"value":"1057-7149","type":"print"},{"value":"1941-0042","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]}}}