{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,20]],"date-time":"2026-04-20T23:51:44Z","timestamp":1776729104501,"version":"3.51.2"},"reference-count":89,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2021,2,17]],"date-time":"2021-02-17T00:00:00Z","timestamp":1613520000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,2,17]],"date-time":"2021-02-17T00:00:00Z","timestamp":1613520000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Process Lett"],"published-print":{"date-parts":[[2021,4]]},"DOI":"10.1007\/s11063-021-10438-5","type":"journal-article","created":{"date-parts":[[2021,2,19]],"date-time":"2021-02-19T06:11:29Z","timestamp":1613715089000},"page":"1229-1251","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["aiTPR: Attribute Interaction-Tensor Product Representation for Image Caption"],"prefix":"10.1007","volume":"53","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1563-9304","authenticated-orcid":false,"given":"Chiranjib","family":"Sur","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,2,17]]},"reference":[{"key":"10438_CR1","unstructured":"Ren S, He K, Girshick R, Sun J (2015). Faster R-CNN: towards real-time object detection with region proposal networks. In: Advances in neural information processing systems, pp 91\u201399"},{"key":"10438_CR2","unstructured":"Gan Z et al (2016) Semantic compositional networks for visual captioning. arXiv preprint arXiv:1611.08002"},{"key":"10438_CR3","unstructured":"Sur C (2019) Representations for vision language intelligence using tensor product representation. Ph.D. dissertation, University of Florida"},{"key":"10438_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11042-019-08021-1","volume":"78","author":"C Sur","year":"2019","unstructured":"Sur C (2019) Survey of deep learning and architectures for visual captioning-transitioning between media and natural languages. Multimedia Tools Appl 78:1\u201351","journal-title":"Multimedia Tools Appl"},{"issue":"11","key":"10438_CR5","doi-asserted-by":"publisher","first-page":"2483","DOI":"10.1007\/s11517-019-02038-2","volume":"57","author":"C Sur","year":"2019","unstructured":"Sur C (2019) GSIAR: gene-subcategory interaction-based improved deep representation learning for breast cancer subcategorical analysis using gene expression, applicable for precision medicine. Med Biol Eng Comput 57(11):2483\u20132515","journal-title":"Med Biol Eng Comput"},{"key":"10438_CR6","doi-asserted-by":"crossref","unstructured":"Karpathy A, Fei-Fei L (2015) Deep visual-semantic alignments for generating image descriptions. In: Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2015.7298932"},{"key":"10438_CR7","doi-asserted-by":"crossref","unstructured":"Devlin J et al (2015) Language models for image captioning: the quirks and what works. arXiv preprint arXiv:1505.01809","DOI":"10.3115\/v1\/P15-2017"},{"key":"10438_CR8","doi-asserted-by":"crossref","unstructured":"Vinyals O et al (2015) Show and tell: a neural image caption generator. In: Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2015.7298935"},{"key":"10438_CR9","doi-asserted-by":"crossref","unstructured":"Chen X, Lawrence Zitnick C (2015) Mind\u2019s eye: a recurrent visual representation for image caption generation. In: Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2015.7298856"},{"key":"10438_CR10","unstructured":"Devlin, J, Gupta, S, Girshick, R, Mitchell, M, Zitnick, C. L. (2015). Exploring nearest neighbor approaches for image captioning. arXiv preprint arXiv:1505.04467"},{"issue":"1","key":"10438_CR11","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1007\/s41688-019-0035-8","volume":"3","author":"S Chiranjib","year":"2019","unstructured":"Chiranjib S (2019) A Multi-Modular System-Genetics (MMSG) approach for deep representation learning for personalized treatment of cancer using sensitivity analysis of precision drugs and gene expression data. Data-Enabled Discov Appl 3(1):11","journal-title":"Data-Enabled Discov Appl"},{"key":"10438_CR12","unstructured":"Xu K et al (2015) Show, attend and tell: neural image caption generation with visual attention. In: International conference on machine learning"},{"key":"10438_CR13","unstructured":"Mao J et al (2014) Deep captioning with multimodal recurrent neural networks (M-RNN). arXiv preprint arXiv:1412.6632"},{"key":"10438_CR14","doi-asserted-by":"crossref","unstructured":"Yao T, Pan Y, Li Y, Qiu Z, Mei T (2017) Boosting image captioning with attributes. In: IEEE international conference on computer vision, ICCV, pp 22\u201329","DOI":"10.1109\/ICCV.2017.524"},{"key":"10438_CR15","doi-asserted-by":"crossref","unstructured":"Rennie SJ, Marcheret E, Mroueh Y, Ross J, Goel V (2017) Self-critical sequence training for image captioning. In: CVPR, vol 1, no 2, p 3","DOI":"10.1109\/CVPR.2017.131"},{"key":"10438_CR16","doi-asserted-by":"crossref","unstructured":"Chen H, Ding G, Lin Z, Zhao S, Han J (2018) Show, observe and tell: attribute-driven attention model for image captioning. In: IJCAI, pp 606\u2013612","DOI":"10.24963\/ijcai.2018\/84"},{"key":"10438_CR17","doi-asserted-by":"crossref","unstructured":"Yao T, Pan Y, Li Y, Mei T (2018) Exploring visual relationship for image captioning. In: Proceedings of the European conference on computer vision (ECCV), pp 684\u2013699","DOI":"10.1007\/978-3-030-01264-9_42"},{"issue":"1\u20132","key":"10438_CR18","first-page":"159","volume":"46","author":"S Paul","year":"1990","unstructured":"Paul S (1990) Tensor product variable binding and the representation of symbolic structures in connectionist systems. Artif Intell 46(1\u20132):159\u2013216","journal-title":"Artif Intell"},{"key":"10438_CR19","doi-asserted-by":"crossref","unstructured":"Lu D, Whitehead S, Huang L, Ji H, Chang SF (2018) Entity-aware image caption generation. arXiv preprint arXiv:1804.07889","DOI":"10.18653\/v1\/D18-1435"},{"key":"10438_CR20","doi-asserted-by":"crossref","unstructured":"Lu J, Yang J, Batra D, Parikh D (2018) Neural baby talk. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7219\u20137228","DOI":"10.1109\/CVPR.2018.00754"},{"key":"10438_CR21","unstructured":"You Q, Jin H, Luo J (2018) Image captioning at will: a versatile scheme for effectively injecting sentiments into image descriptions. arXiv preprint arXiv:1801.10121"},{"key":"10438_CR22","unstructured":"Melnyk I, Sercu T, Dognin PL, Ross J, Mroueh Y (2018) Improved image captioning with adversarial semantic alignment. arXiv preprint arXiv:1805.00063"},{"key":"10438_CR23","unstructured":"Wu J, Hu Z, Mooney RJ (2018) Joint image captioning and question answering. arXiv preprint arXiv:1805.08389"},{"key":"10438_CR24","doi-asserted-by":"crossref","unstructured":"Chen F, Ji R, Su J, Wu Y, Wu Y (2017) Structcap: structured semantic embedding for image captioning. In: Proceedings of the 2017 ACM on multimedia conference. ACM, pp 46\u201354","DOI":"10.1145\/3123266.3123275"},{"key":"10438_CR25","doi-asserted-by":"crossref","unstructured":"Jiang W, Ma L, Chen X, Zhang H, Liu W (2018) Learning to guide decoding for image captioning. arXiv preprint arXiv:1804.00887","DOI":"10.1609\/aaai.v32i1.12283"},{"key":"10438_CR26","first-page":"100","volume":"67","author":"C Wu","year":"2018","unstructured":"Wu C, Wei Y, Chu X, Su F, Wang L (2018) Modeling visual and word-conditional semantic attention for image captioning. Signal Process: Image Commun 67:100\u2013107","journal-title":"Signal Process: Image Commun"},{"key":"10438_CR27","first-page":"1","volume":"99","author":"K Fu","year":"2018","unstructured":"Fu K, Li J, Jin J, Zhang C (2018) Image-text surgery: efficient concept learning in image captioning by generating pseudopairs. IEEE Trans Neural Netw Learn Syst 99:1\u201312","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"issue":"2","key":"10438_CR28","first-page":"48","volume":"14","author":"M Cornia","year":"2018","unstructured":"Cornia M, Baraldi L, Serra G, Cucchiara R (2018) Paying more attention to saliency: image captioning with saliency and context attention. ACM Trans Multimedia Comput Commun Appl (TOMM) 14(2):48","journal-title":"ACM Trans Multimedia Comput Commun Appl (TOMM)"},{"key":"10438_CR29","doi-asserted-by":"crossref","unstructured":"Zhao W, Wang B, Ye J, Yang M, Zhao Z, Luo R, Qiao Y (2018) A multi-task learning approach for image captioning. In: IJCAI, pp 1205\u20131211","DOI":"10.24963\/ijcai.2018\/168"},{"key":"10438_CR30","unstructured":"Li X, Wang X, Xu C, Lan W, Wei Q, Yang G, Xu J (2018) COCO-CN for cross-lingual image tagging, captioning and retrieval. arXiv preprint arXiv:1805.08661"},{"key":"10438_CR31","doi-asserted-by":"crossref","unstructured":"Sur C, Liu P, Zhou Y, Wu D (2019) Semantic tensor product for image captioning. In: 2019 5th international conference on big data computing and communications (BIGCOM). IEEE, pp 33\u201337","DOI":"10.1109\/BIGCOM.2019.00013"},{"key":"10438_CR32","doi-asserted-by":"crossref","unstructured":"Chen M, Ding G, Zhao S, Chen H, Liu Q, Han J (2017) Reference based LSTM for image captioning. In: AAAI, pp 3981\u20133987","DOI":"10.1609\/aaai.v31i1.11198"},{"key":"10438_CR33","unstructured":"Chen H, Zhang H, Chen PY, Yi J, Hsieh CJ (2017) Show-and-fool: crafting adversarial examples for neural image captioning. arXiv preprint arXiv:1712.02051"},{"key":"10438_CR34","doi-asserted-by":"publisher","first-page":"228","DOI":"10.1007\/s42979-020-00234-8","volume":"1","author":"C Sur","year":"2020","unstructured":"Sur C (2020) GenAtSeq GAN with heuristic reforms for knowledge centric network with browsing characteristics learning, individual tracking and malware detection with Website2Vec. SN Comput Sci 1:228. https:\/\/doi.org\/10.1007\/s42979-020-00234-8","journal-title":"SN Comput Sci"},{"key":"10438_CR35","doi-asserted-by":"publisher","first-page":"5514","DOI":"10.1109\/TIP.2018.2855406","volume":"27","author":"S Ye","year":"2018","unstructured":"Ye S, Liu N, Han J (2018) Attentive linear transformation for image captioning. IEEE Trans Image Process 27:5514\u20135524","journal-title":"IEEE Trans Image Process"},{"key":"10438_CR36","doi-asserted-by":"crossref","unstructured":"Wang Y, Lin Z, Shen X, Cohen S, Cottrell GW (2017) Skeleton key: image captioning by skeleton-attribute decomposition. arXiv preprint arXiv:1704.06972","DOI":"10.1109\/CVPR.2017.780"},{"key":"10438_CR37","doi-asserted-by":"crossref","unstructured":"Chen T, Zhang Z, You Q, Fang C, Wang Z, Jin H, Luo J (2018) \u201cFactual\u201d or \u201cEmotional\u201d: stylized image captioning with adaptive learning and attention. arXiv preprint arXiv:1807.03871","DOI":"10.1007\/978-3-030-01249-6_32"},{"key":"10438_CR38","doi-asserted-by":"crossref","unstructured":"Chen F, Ji R, Sun X, Wu Y, Su J (2018) GroupCap: group-based image captioning with structured relevance and diversity constraints. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1345\u20131353","DOI":"10.1109\/CVPR.2018.00146"},{"key":"10438_CR39","doi-asserted-by":"crossref","unstructured":"Liu C, Sun F, Wang C, Wang F, Yuille A (2017) MAT: a multimodal attentive translator for image captioning. arXiv preprint arXiv:1702.05658","DOI":"10.24963\/ijcai.2017\/563"},{"key":"10438_CR40","doi-asserted-by":"crossref","unstructured":"Harzig P, Brehm S, Lienhart R, Kaiser C, Schallner R (2018) Multimodal image captioning for marketing analysis. arXiv preprint arXiv:1802.01958","DOI":"10.1109\/MIPR.2018.00035"},{"key":"10438_CR41","doi-asserted-by":"crossref","unstructured":"Liu X, Li H, Shao J, Chen D, Wang X (2018) Show, tell and discriminate: image captioning by self-retrieval with partially labeled data. arXiv preprint arXiv:1803.08314","DOI":"10.1007\/978-3-030-01267-0_21"},{"key":"10438_CR42","unstructured":"Chunseong Park C, Kim B, Kim G (2017) Attend to you: personalized image captioning with context sequence memory networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 895\u2013903"},{"key":"10438_CR43","doi-asserted-by":"crossref","unstructured":"Sharma P, Ding N, Goodman S, Soricut R (2018) Conceptual captions: a cleaned, Hypernymed, image alt-text dataset for automatic image captioning. In: Proceedings of the 56th annual meeting of the association for computational linguistics, vol 1. Long Papers, pp 2556\u20132565","DOI":"10.18653\/v1\/P18-1238"},{"key":"10438_CR44","doi-asserted-by":"crossref","unstructured":"Yao T, Pan Y, Li Y, Mei T (2017) Incorporating copying mechanism in image captioning for learning novel objects. In: 2017 IEEE conference on computer vision and pattern recognition (CVPR). IEEE, pp 5263\u20135271","DOI":"10.1109\/CVPR.2017.559"},{"issue":"9","key":"10438_CR45","doi-asserted-by":"publisher","first-page":"3573","DOI":"10.1007\/s12652-018-1084-9","volume":"10","author":"S Chiranjib","year":"2019","unstructured":"Chiranjib S (2019) DeepSeq: learning browsing log data based personalized security vulnerabilities and counter intelligent measures. J Ambient Intell Human Comput 10(9):3573\u20133602","journal-title":"J Ambient Intell Human Comput"},{"key":"10438_CR46","unstructured":"Zhang L, Sung F, Liu F, Xiang T, Gong S, Yang Y, Hospedales TM (2017) Actor-critic sequence training for image captioning. arXiv preprint arXiv:1706.09601"},{"key":"10438_CR47","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s12065-018-0165-1","volume":"12","author":"C Sur","year":"2019","unstructured":"Sur C (2019) UCRLF: unified constrained reinforcement learning framework for phase-aware architectures for autonomous vehicle signaling and trajectory optimization. Evolut Intell 12:1\u201324","journal-title":"Evolut Intell"},{"issue":"12","key":"10438_CR48","doi-asserted-by":"publisher","first-page":"2321","DOI":"10.1109\/TPAMI.2016.2642953","volume":"39","author":"K Fu","year":"2017","unstructured":"Fu K, Jin J, Cui R, Sha F, Zhang C (2017) Aligning where to see and what to tell: image captioning with region-based attention and scene-specific contexts. IEEE Trans Pattern Anal Mach Intell 39(12):2321\u20132334","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10438_CR49","doi-asserted-by":"crossref","unstructured":"Ren Z, Wang X, Zhang N, Lv X, Li LJ (2017) Deep reinforcement learning-based image captioning with embedding reward. arXiv preprint arXiv:1704.03899","DOI":"10.1109\/CVPR.2017.128"},{"key":"10438_CR50","doi-asserted-by":"crossref","unstructured":"Liu S, Zhu Z, Ye N, Guadarrama S, Murphy K (2017) Improved image captioning via policy gradient optimization of spider. In: Proceedings on IEEE international conference on computer vision, vol 3, p 3","DOI":"10.1109\/ICCV.2017.100"},{"key":"10438_CR51","unstructured":"Cohn-Gordon R, Goodman N, Potts C (2018) Pragmatically informative image captioning with character-level reference. arXiv preprint arXiv:1804.05417"},{"key":"10438_CR52","doi-asserted-by":"crossref","unstructured":"Liu C, Mao J, Sha F, Yuille AL (2017) Attention correctness in neural image captioning. In: AAAI, pp 4176\u20134182","DOI":"10.1609\/aaai.v31i1.11197"},{"key":"10438_CR53","doi-asserted-by":"crossref","unstructured":"Lu J, Xiong C, Parikh D, Socher R (2017) Knowing when to look: adaptive attention via a visual sentinel for image captioning. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), vol 6, p 2","DOI":"10.1109\/CVPR.2017.345"},{"issue":"4","key":"10438_CR54","doi-asserted-by":"publisher","first-page":"652","DOI":"10.1109\/TPAMI.2016.2587640","volume":"39","author":"O Vinyals","year":"2017","unstructured":"Vinyals O, Toshev A, Bengio S, Erhan D (2017) Show and tell: lessons learned from the 2015 MSCOCO image captioning challenge. IEEE Trans Pattern Anal Mach Intell 39(4):652\u2013663","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10438_CR55","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1109\/TIP.2018.2855415","volume":"28","author":"M Zhang","year":"2018","unstructured":"Zhang M, Yang Y, Zhang H, Ji Y, Shen HT, Chua TS (2018) More is better: precise and detailed image captioning using online positive recall and missing concepts mining. IEEE Trans Image Process 28:32\u201344","journal-title":"IEEE Trans Image Process"},{"key":"10438_CR56","doi-asserted-by":"publisher","first-page":"999","DOI":"10.1109\/TPAMI.2018.2824816","volume":"41","author":"CC Park","year":"2018","unstructured":"Park CC, Kim B, Kim G (2018) Towards personalized image captioning via multimodal memory networks. IEEE Trans Pattern Anal Mach Intell 41:999\u20131012","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10438_CR57","doi-asserted-by":"publisher","first-page":"1367","DOI":"10.1109\/TPAMI.2017.2708709","volume":"40","author":"Q Wu","year":"2017","unstructured":"Wu Q, Shen C, Wang P, Dick A, van den Hengel A (2017) Image captioning and visual question answering based on attributes and external knowledge. IEEE Trans Pattern Anal Mach Intell 40:1367\u20131381","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10438_CR58","doi-asserted-by":"crossref","unstructured":"Gan C et al (2017) Stylenet: generating attractive visual captions with styles. In: CVPR","DOI":"10.1109\/CVPR.2017.108"},{"key":"10438_CR59","unstructured":"Jin J et al (2015) Aligning where to see and what to tell: image caption with region-based attention and scene factorization. arXiv preprint arXiv:1506.06272"},{"key":"10438_CR60","unstructured":"Kiros R, Salakhutdinov R, Zemel RS (2014) Unifying visual-semantic embeddings with multimodal neural language models. arXiv preprint arXiv:1411.2539"},{"key":"10438_CR61","unstructured":"Pu Y et al (2016) Variational autoencoder for deep learning of images, labels and captions. In: Advances in neural information processing systems"},{"key":"10438_CR62","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1162\/tacl_a_00177","volume":"2","author":"R Socher","year":"2014","unstructured":"Socher R et al (2014) Grounded compositional semantics for finding and describing images with sentences. Trans Assoc Comput Linguist 2:207\u2013218","journal-title":"Trans Assoc Comput Linguist"},{"key":"10438_CR63","unstructured":"Sutskever I, Martens J, Hinton GE (2011) Generating text with recurrent neural networks. In: Proceedings of the 28th international conference on machine learning (ICML-11)"},{"key":"10438_CR64","unstructured":"Ilya S, Oriol V, Le QV (2014) Sequence to sequence learning with neural networks. In: Advances in neural information processing systems"},{"key":"10438_CR65","doi-asserted-by":"crossref","unstructured":"LTran D et al (2015) Learning spatiotemporal features with 3d convolutional networks. In: Proceedings of the IEEE international conference on computer vision","DOI":"10.1109\/ICCV.2015.510"},{"key":"10438_CR66","doi-asserted-by":"crossref","unstructured":"Tran K et al (2016) Rich image captioning in the wild. In: Proceedings of the IEEE conference on computer vision and pattern recognition workshops","DOI":"10.1109\/CVPRW.2016.61"},{"key":"10438_CR67","doi-asserted-by":"crossref","unstructured":"You Q et al (2016) Image captioning with semantic attention. In: Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2016.503"},{"key":"10438_CR68","doi-asserted-by":"crossref","unstructured":"Girshick R et al (2014) Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2014.81"},{"key":"10438_CR69","doi-asserted-by":"crossref","unstructured":"Jia X et al (2015) Guiding the long-short term memory model for image caption generation. In: Proceedings of the IEEE international conference on computer vision","DOI":"10.1109\/ICCV.2015.277"},{"issue":"12","key":"10438_CR70","doi-asserted-by":"publisher","first-page":"2891","DOI":"10.1109\/TPAMI.2012.162","volume":"35","author":"G Kulkarni","year":"2013","unstructured":"Kulkarni G et al (2013) Babytalk: understanding and generating simple image descriptions. IEEE Trans Pattern Anal Mach Intell 35(12):2891\u20132903","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"10","key":"10438_CR71","doi-asserted-by":"publisher","first-page":"351","DOI":"10.1162\/tacl_a_00188","volume":"2","author":"P Kuznetsova","year":"2014","unstructured":"Kuznetsova P et al (2014) TREETALK: composition and compression of trees for image descriptions. TACL 2(10):351\u2013362","journal-title":"TACL"},{"key":"10438_CR72","doi-asserted-by":"crossref","unstructured":"Mao J et al (2015) Learning like a child: fast novel visual concept learning from sentence descriptions of images. In: Proceedings of the IEEE international conference on computer vision","DOI":"10.1109\/ICCV.2015.291"},{"key":"10438_CR73","doi-asserted-by":"crossref","unstructured":"Mathews A, Xie L, He X (2016) SentiCap: generating image descriptions with sentiments. In: AAAI","DOI":"10.1609\/aaai.v30i1.10475"},{"key":"10438_CR74","unstructured":"Yang Y et al (2011) Corpus-guided sentence generation of natural images. In: Proceedings of the conference on empirical methods in natural language processing. Association for Computational Linguistics"},{"key":"10438_CR75","unstructured":"Sur C (2020) SACT: self-aware multi-space feature composition transformer for multinomial attention for video captioning. arXiv preprint arXiv:2006.14262"},{"key":"10438_CR76","unstructured":"Sur C (2020) Self-segregating and coordinated-segregating transformer for focused deep multi-modular network for visual question answering. arXiv preprint arXiv:2006.14264"},{"key":"10438_CR77","unstructured":"Sur C (2020) ReLGAN: generalization of consistency for GAN with disjoint constraints and relative learning of generative processes for multiple transformation learning. arXiv preprint arXiv:2006.07809"},{"key":"10438_CR78","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1007\/s42979-020-00238-4","volume":"1","author":"C Sur","year":"2020","unstructured":"Sur C (2020) AACR: feature fusion effects of algebraic amalgamation composed representation on (de)compositional network for caption generation for images. SN Comput Sci 1:229. https:\/\/doi.org\/10.1007\/s42979-020-00238-4","journal-title":"SN Comput Sci"},{"key":"10438_CR79","unstructured":"Sur C (2020) Gaussian Smoothen Semantic Features (GSSF)\u2014exploring the linguistic aspects of visual captioning in Indian Languages (Bengali) using MSCOCO framework. arXiv preprint arXiv:2002.06701"},{"key":"10438_CR80","unstructured":"Sur C (2020) MRRC: multiple role representation crossover interpretation for image captioning with R-CNN feature distribution composition (FDC). arXiv preprint arXiv:2002.06436"},{"key":"10438_CR81","unstructured":"Sur C (2019) CRUR: coupled-recurrent unit for unification, conceptualization and context capture for language representation\u2014a generalization of bi directional LSTM. arXiv preprint arXiv:1911.10132"},{"issue":"1","key":"10438_CR82","first-page":"22","volume":"2","author":"S Chiranjib","year":"2020","unstructured":"Chiranjib S (2020) RBN: enhancement in language attribute prediction using global representation of natural language transfer learning technology like Google BERT. SN Appl Sci 2(1):22","journal-title":"SN Appl Sci"},{"key":"10438_CR83","unstructured":"Sur C (2019) Tpsgtr: neural-symbolic tensor product scene-graph-triplet representation for image captioning. arXiv preprint arXiv:1911.10115"},{"key":"10438_CR84","unstructured":"Sur C (2018) Feature fusion effects of tensor product representation on (de) compositional network for caption generation for images. arXiv preprint arXiv:1812.06624"},{"key":"10438_CR85","doi-asserted-by":"crossref","unstructured":"Donahue J et al. (2015) Long-term recurrent convolutional networks for visual recognition and description. In: Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2015.7298878"},{"key":"10438_CR86","doi-asserted-by":"crossref","unstructured":"Fang H et al (2015) From captions to visual concepts and back. In: Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2015.7298754"},{"issue":"2s","key":"10438_CR87","first-page":"40","volume":"14","author":"C Wang","year":"2018","unstructured":"Wang C, Yang H, Bartz C, Meinel C (2018) Image captioning with deep bidirectional LSTMs and multi-task learning. ACM Trans Multimedia Comput Commun Appl (TOMM) 14(2s):40","journal-title":"ACM Trans Multimedia Comput Commun Appl (TOMM)"},{"key":"10438_CR88","doi-asserted-by":"crossref","unstructured":"Anderson P, He X, Buehler C, Teney D, Johnson M, Gould S, Zhang L (2018) Bottom-up and top-down attention for image captioning and visual question answering. In: CVPR, vol 3, no 5, p 6","DOI":"10.1109\/CVPR.2018.00636"},{"key":"10438_CR89","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s13735-020-00192-0","volume":"9","author":"C Sur","year":"2020","unstructured":"Sur C (2020) MRECN: mixed representation enhanced (de) compositional network for caption generation from visual features, modeling as pseudo tensor product representation. Int J Multimedia Inf Retr 9:1\u201326","journal-title":"Int J Multimedia Inf Retr"}],"container-title":["Neural Processing Letters"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-021-10438-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11063-021-10438-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-021-10438-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,18]],"date-time":"2022-12-18T04:43:50Z","timestamp":1671338630000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11063-021-10438-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,2,17]]},"references-count":89,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2021,4]]}},"alternative-id":["10438"],"URL":"https:\/\/doi.org\/10.1007\/s11063-021-10438-5","relation":{},"ISSN":["1370-4621","1573-773X"],"issn-type":[{"value":"1370-4621","type":"print"},{"value":"1573-773X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,2,17]]},"assertion":[{"value":"27 January 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 February 2021","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with Ethical Standards"}},{"value":"On behalf of all authors, the corresponding author states that there is no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain any studies with human participants or animals performed by any of the authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}}]}}