{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:22:04Z","timestamp":1750220524120,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":10,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,1,2]],"date-time":"2021-01-02T00:00:00Z","timestamp":1609545600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,1,2]]},"DOI":"10.1145\/3430984.3431059","type":"proceedings-article","created":{"date-parts":[[2020,12,28]],"date-time":"2020-12-28T05:34:44Z","timestamp":1609133684000},"page":"427-427","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Image Captioning with Pretrained Language Generators"],"prefix":"10.1145","author":[{"given":"Saketh","family":"Vishnubhatla","sequence":"first","affiliation":[{"name":"Bits Pilani Hyderabad Campus"}]},{"given":"Nishant","family":"Sinha","sequence":"additional","affiliation":[{"name":"OffNote Labs"}]}],"member":"320","published-online":{"date-parts":[[2021,1,2]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","unstructured":"Johnson et al.2016. DenseCap: Fully Convolutional Localization Networks for Dense Captioning.  Johnson et al.2016. DenseCap: Fully Convolutional Localization Networks for Dense Captioning.","DOI":"10.1109\/CVPR.2016.494"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","unstructured":"P.\u00a0Anderson et al.2018. Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering.  P.\u00a0Anderson et al.2018. Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering.","DOI":"10.1109\/CVPR.2018.00636"},{"key":"e_1_3_2_1_3_1","unstructured":"Radford et al.2018. Language models are unsupervised multitask learners. (2018).  Radford et al.2018. Language models are unsupervised multitask learners. (2018)."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"crossref","unstructured":"Ting\u00a0Yao et al.2018. Exploring Visual Relationship for Image Captioning. (2018).  Ting\u00a0Yao et al.2018. Exploring Visual Relationship for Image Captioning. (2018).","DOI":"10.1007\/978-3-030-01264-9_42"},{"key":"e_1_3_2_1_5_1","unstructured":"Ranjay Krishna\u00a0et al.2016. Visual Genome.  Ranjay Krishna\u00a0et al.2016. Visual Genome."},{"key":"e_1_3_2_1_6_1","unstructured":"Jiasen Lu\u00a0et al.CVPR 2018. Neural baby talk.  Jiasen Lu\u00a0et al.CVPR 2018. Neural baby talk."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Matt Post. 2018. A Call for Clarity in Reporting BLEU Scores.  Matt Post. 2018. A Call for Clarity in Reporting BLEU Scores.","DOI":"10.18653\/v1\/W18-6319"},{"key":"e_1_3_2_1_8_1","unstructured":"Colin Raffel\u00a0et al.2019. Exploring the limits of transfer learning with a unified text-to-text transformer. (2019).  Colin Raffel\u00a0et al.2019. Exploring the limits of transfer learning with a unified text-to-text transformer. (2019)."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"Kaihua Tang\u00a0et al.2020. Unbiased scene graph generation from biased training.  Kaihua Tang\u00a0et al.2020. Unbiased scene graph generation from biased training.","DOI":"10.1109\/CVPR42600.2020.00377"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"crossref","unstructured":"Dalin Wang Daniel Beck and Trevor Cohn. 2019. On the Role of Scene Graphs in Image Captioning.  Dalin Wang Daniel Beck and Trevor Cohn. 2019. On the Role of Scene Graphs in Image Captioning.","DOI":"10.1109\/CVPR.2019.01094"}],"event":{"name":"CODS COMAD 2021: 8th ACM IKDD CODS and 26th COMAD","acronym":"CODS COMAD 2021","location":"Bangalore India"},"container-title":["Proceedings of the 3rd ACM India Joint International Conference on Data Science &amp; Management of Data (8th ACM IKDD CODS &amp; 26th COMAD)"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3430984.3431059","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3430984.3431059","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T21:24:44Z","timestamp":1750195484000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3430984.3431059"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,2]]},"references-count":10,"alternative-id":["10.1145\/3430984.3431059","10.1145\/3430984"],"URL":"https:\/\/doi.org\/10.1145\/3430984.3431059","relation":{},"subject":[],"published":{"date-parts":[[2021,1,2]]},"assertion":[{"value":"2021-01-02","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}