{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,20]],"date-time":"2026-05-20T14:57:00Z","timestamp":1779289020657,"version":"3.51.4"},"reference-count":80,"publisher":"Springer Science and Business Media LLC","issue":"33","license":[{"start":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T00:00:00Z","timestamp":1709337600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T00:00:00Z","timestamp":1709337600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100006469","name":"Fundo para o Desenvolvimento das Ci\u00eancias e da Tecnologia","doi-asserted-by":"publisher","award":["0061\/2020\/A2"],"award-info":[{"award-number":["0061\/2020\/A2"]}],"id":[{"id":"10.13039\/501100006469","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-024-18598-x","type":"journal-article","created":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T07:01:52Z","timestamp":1709362912000},"page":"79985-80005","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Data reweighting net for web fine-grained image classification"],"prefix":"10.1007","volume":"83","author":[{"given":"Yifeng","family":"Liu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhenxin","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5296-0922","authenticated-orcid":false,"given":"Sio-long","family":"Lo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhenqiang","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Gang","family":"Ke","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chuan","family":"Yue","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,3,2]]},"reference":[{"issue":"5","key":"18598_CR1","doi-asserted-by":"publisher","first-page":"6807","DOI":"10.1007\/S11042-022-13423-9","volume":"82","author":"MM Balaha","year":"2023","unstructured":"Balaha MM, El-Kady S, Balaha HM, Salama M, Emad E, Hassan M, Saafan MM (2023) A vision-based deep learning approach for independent-users arabic sign language interpretation. Multim Tools Appl 82(5):6807\u20136826. https:\/\/doi.org\/10.1007\/S11042-022-13423-9","journal-title":"Multim Tools Appl"},{"issue":"29","key":"18598_CR2","doi-asserted-by":"publisher","first-page":"41899","DOI":"10.1007\/S11042-021-11473-Z","volume":"81","author":"U Ahmed","year":"2022","unstructured":"Ahmed U, Lin JC, Srivastava G (2022) Mitigating adversarial evasion attacks by deep active learning for medical image classification. Multim Tools Appl 81(29):41899\u201341910. https:\/\/doi.org\/10.1007\/S11042-021-11473-Z","journal-title":"Multim Tools Appl"},{"issue":"29","key":"18598_CR3","doi-asserted-by":"publisher","first-page":"42649","DOI":"10.1007\/S11042-022-13486-8","volume":"81","author":"A Sharma","year":"2022","unstructured":"Sharma A, Mishra PK (2022) Image enhancement techniques on deep learning approaches for automated diagnosis of COVID-19 features using CXR images. Multim Tools Appl 81(29):42649\u201342690. https:\/\/doi.org\/10.1007\/S11042-022-13486-8","journal-title":"Multim Tools Appl"},{"issue":"29","key":"18598_CR4","doi-asserted-by":"publisher","first-page":"42309","DOI":"10.1007\/S11042-022-13493-9","volume":"81","author":"R Raghavan","year":"2022","unstructured":"Raghavan R, Verma DC, Pandey D, Anand R, Pandey BK, Singh H (2022) Optimized building extraction from high-resolution satellite imagery using deep learning. Multim Tools Appl 81(29):42309\u201342323. https:\/\/doi.org\/10.1007\/S11042-022-13493-9","journal-title":"Multim Tools Appl"},{"issue":"30","key":"18598_CR5","doi-asserted-by":"publisher","first-page":"44291","DOI":"10.1007\/S11042-022-12892-2","volume":"81","author":"S Yadavendra Chand","year":"2022","unstructured":"Yadavendra Chand S (2022) Semantic segmentation and detection of satellite objects using u-net model of deep learning. Multim Tools Appl 81(30):44291\u201344310. https:\/\/doi.org\/10.1007\/S11042-022-12892-2","journal-title":"Multim Tools Appl"},{"issue":"1","key":"18598_CR6","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1109\/TIP.2018.2869721","volume":"28","author":"Y Yao","year":"2019","unstructured":"Yao Y, Shen F, Zhang J, Liu L, Tang Z, Shao L (2019) Extracting privileged information for enhancing classifier learning. IEEE Trans Image Process 28(1):436\u2013450. https:\/\/doi.org\/10.1109\/TIP.2018.2869721","journal-title":"IEEE Trans Image Process"},{"issue":"1","key":"18598_CR7","doi-asserted-by":"publisher","first-page":"184","DOI":"10.1109\/TMM.2018.2847248","volume":"21","author":"Y Yao","year":"2019","unstructured":"Yao Y, Shen F, Zhang J, Liu L, Tang Z, Shao L (2019) Extracting multiple visual senses for web learning. IEEE Trans. Multim. 21(1):184\u2013196. https:\/\/doi.org\/10.1109\/TMM.2018.2847248","journal-title":"IEEE Trans. Multim."},{"key":"18598_CR8","doi-asserted-by":"publisher","unstructured":"Xie G-S, Liu L, Jin X, Zhu F, Zhang Z, Qin J, Yao Y, Shao L (2019) Attentive region embedding network for zero-shot learning. In: 2019 IEEE\/CVF Conference on computer vision and pattern recognition (CVPR), pp 9376\u20139385. https:\/\/doi.org\/10.1109\/CVPR.2019.00961","DOI":"10.1109\/CVPR.2019.00961"},{"key":"18598_CR9","doi-asserted-by":"publisher","unstructured":"Luo H, Lin G, Liu Z, Liu F, Tang Z, Yao Y (2019) Segeqa: video segmentation based visual attention for embodied question answering. In: 2019 IEEE\/CVF International conference on computer vision (ICCV), pp 9666\u20139675 . https:\/\/doi.org\/10.1109\/ICCV.2019.00976","DOI":"10.1109\/ICCV.2019.00976"},{"key":"18598_CR10","doi-asserted-by":"crossref","unstructured":"Xie G-S, Liu L, Zhu F, Zhao F, Zhang Z, Yao Y, Qin J, Shao L (2020) Region graph embedding network for zero-shot learning. In: Computer vision\u2013ECCV 2020: 16th European conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part IV 16, pp 562\u2013580 . Springer","DOI":"10.1007\/978-3-030-58548-8_33"},{"key":"18598_CR11","doi-asserted-by":"publisher","unstructured":"Yao Y, Hua X, Gao G, Sun Z, Li Z, Zhang J (2020) Bridging the web data and fine-grained visual recognition via alleviating label noise and domain mismatch. In: Proceedings of the 28th ACM international conference on multimedia. MM \u201920, pp 1735\u20131744. Association for Computing Machinery, New York, USA. https:\/\/doi.org\/10.1145\/3394171.3413851","DOI":"10.1145\/3394171.3413851"},{"key":"18598_CR12","doi-asserted-by":"publisher","unstructured":"Sun Z, Shen F, Huang D, Wang Q, Shu X, Yao Y, Tang J (2022) Pnp: robust learning from noisy labels by probabilistic noise prediction. In: 2022 IEEE\/CVF Conference on computer vision and pattern recognition (CVPR), pp 5301\u20135310. https:\/\/doi.org\/10.1109\/CVPR52688.2022.00524","DOI":"10.1109\/CVPR52688.2022.00524"},{"issue":"4","key":"18598_CR13","doi-asserted-by":"publisher","first-page":"905","DOI":"10.1109\/TPAMI.2017.2705122","volume":"40","author":"X Shu","year":"2018","unstructured":"Shu X, Tang J, Li Z, Lai H, Zhang L, Yan S (2018) Personalized age progression with bi-level aging dictionary learning. IEEE Trans Pattern Anal Mach Intell 40(4):905\u2013917. https:\/\/doi.org\/10.1109\/TPAMI.2017.2705122","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"3","key":"18598_CR14","doi-asserted-by":"publisher","first-page":"1110","DOI":"10.1109\/TPAMI.2019.2942030","volume":"43","author":"X Shu","year":"2021","unstructured":"Shu X, Tang J, Qi G, Liu W, Yang J (2021) Hierarchical long short-term concurrent memory for human interaction recognition. IEEE Trans Pattern Anal Mach Intell 43(3):1110\u20131118. https:\/\/doi.org\/10.1109\/TPAMI.2019.2942030","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"18598_CR15","doi-asserted-by":"publisher","unstructured":"Nie L, Yan S, Wang M, Hong R, Chua T-S (2012) Harvesting visual concepts for image search with complex queries. In: Proceedings of the 20th ACM international conference on multimedia. MM \u201912, pp 59\u201368. Association for Computing Machinery, New York, USA. https:\/\/doi.org\/10.1145\/2393347.2393363","DOI":"10.1145\/2393347.2393363"},{"issue":"8","key":"18598_CR16","doi-asserted-by":"publisher","first-page":"2107","DOI":"10.1109\/TKDE.2015.2399298","volume":"27","author":"L Nie","year":"2015","unstructured":"Nie L, Wang M, Zhang L, Yan S, Zhang B, Chua T (2015) Disease inference from health-related questions via sparse deep learning. IEEE Trans Knowl Data Eng 27(8):2107\u20132119. https:\/\/doi.org\/10.1109\/TKDE.2015.2399298","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"18598_CR17","doi-asserted-by":"publisher","unstructured":"Yao Y, Chen T, Xie G-S, Zhang C, Shen F, Wu Q, Tang Z, Zhang J (2021) Non-salient region object mining for weakly supervised semantic segmentation. In: 2021 IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 2623\u20132632. https:\/\/doi.org\/10.1109\/CVPR46437.2021.00265","DOI":"10.1109\/CVPR46437.2021.00265"},{"issue":"2","key":"18598_CR18","doi-asserted-by":"publisher","first-page":"396","DOI":"10.1109\/TKDE.2014.2330813","volume":"27","author":"L Nie","year":"2015","unstructured":"Nie L, Zhao Y, Akbari M, Shen J, Chua T (2015) Bridging the vocabulary gap between health seekers and healthcare knowledge. IEEE Trans Knowl Data Eng 27(2):396\u2013409. https:\/\/doi.org\/10.1109\/TKDE.2014.2330813","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"18598_CR19","unstructured":"Wah C, Branson S, Welinder P, Perona P, Belongie S (2011) The caltech-ucsd birds-200-2011 dataset"},{"key":"18598_CR20","doi-asserted-by":"publisher","unstructured":"Krause J, Stark M, Deng J, Fei-Fei L (2013) 3d object representations for fine-grained categorization. In: 2013 IEEE International conference on computer vision workshops, pp 554\u2013561. https:\/\/doi.org\/10.1109\/ICCVW.2013.77","DOI":"10.1109\/ICCVW.2013.77"},{"key":"18598_CR21","unstructured":"Maji S, Rahtu E, Kannala J, Blaschko M, Vedaldi A (2013) Fine-grained visual classification of aircraft. arXiv:1306.5151"},{"issue":"8","key":"18598_CR22","doi-asserted-by":"publisher","first-page":"1771","DOI":"10.1109\/TMM.2017.2684626","volume":"19","author":"Y Yao","year":"2017","unstructured":"Yao Y, Zhang J, Shen F, Hua X, Xu J, Tang Z (2017) Exploiting web images for dataset construction: A domain robust approach. IEEE Trans Multim 19(8):1771\u20131784. https:\/\/doi.org\/10.1109\/TMM.2017.2684626","journal-title":"IEEE Trans Multim"},{"issue":"6","key":"18598_CR23","doi-asserted-by":"publisher","first-page":"1199","DOI":"10.1109\/TKDE.2019.2903036","volume":"32","author":"Y Yao","year":"2020","unstructured":"Yao Y, Zhang J, Shen F, Liu L, Zhu F, Zhang D, Shen HT (2020) Towards automatic construction of diverse, high-quality image datasets. IEEE Trans Knowl Data Eng 32(6):1199\u20131211. https:\/\/doi.org\/10.1109\/TKDE.2019.2903036","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"18598_CR24","doi-asserted-by":"publisher","unstructured":"Yao Y, Hua X-s, Shen F, Zhang J, Tang Z (2016) A domain robust approach for image dataset construction. In: Proceedings of the 24th ACM international conference on multimedia. MM \u201916, pp 212\u2013216. Association for Computing Machinery, New York, USA. https:\/\/doi.org\/10.1145\/2964284.2967213","DOI":"10.1145\/2964284.2967213"},{"key":"18598_CR25","doi-asserted-by":"publisher","unstructured":"Zhang C, Yao Y, Liu H, Xie G-S, Shu X, Zhou T, Zhang Z, Shen F, Tang Z (2020) Web-supervised network with softly update-drop training for fine-grained visual classification. Proceedings of the AAAI Conference on Artificial Intelligence 34(07):12781\u201312788. https:\/\/doi.org\/10.1609\/aaai.v34i07.6973","DOI":"10.1609\/aaai.v34i07.6973"},{"key":"18598_CR26","doi-asserted-by":"publisher","unstructured":"Sun Z, Hua X-S, Yao Y, Wei X-S, Hu G, Zhang J (2020) Crssc: salvage reusable samples from noisy data for robust learning. In: Proceedings of the 28th ACM international conference on multimedia. MM \u201920, pp 92\u2013101. Association for Computing Machinery, New York, USA. https:\/\/doi.org\/10.1145\/3394171.3413978","DOI":"10.1145\/3394171.3413978"},{"key":"18598_CR27","doi-asserted-by":"crossref","unstructured":"Sun Z, Yao Y, Wei X-S, Zhang Y, Shen F, Wu J, Zhang J, Shen HT (2021) Webly supervised fine-grained recognition: benchmark datasets and an approach. In: Proceedings of the IEEE\/CVF international conference on computer vision (ICCV), pp 10602\u201310611","DOI":"10.1109\/ICCV48922.2021.01043"},{"key":"18598_CR28","unstructured":"Arpit D, Jastrz\u0119bski S, Ballas N, Krueger D, Bengio E, Kanwal MS, Maharaj T, Fischer A, Courville A, Bengio Y, et\u00a0al. (2017) A closer look at memorization in deep networks. In: International conference on machine learning, pp 233\u2013242. PMLR"},{"issue":"3","key":"18598_CR29","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/3446776","volume":"64","author":"C Zhang","year":"2021","unstructured":"Zhang C, Bengio S, Hardt M, Recht B, Vinyals O (2021) Understanding deep learning (still) requires rethinking generalization. Commun ACM 64(3):107\u2013115. https:\/\/doi.org\/10.1145\/3446776","journal-title":"Commun ACM"},{"issue":"2","key":"18598_CR30","doi-asserted-by":"publisher","first-page":"1845","DOI":"10.1007\/s11063-018-9963-9","volume":"50","author":"W Zhang","year":"2019","unstructured":"Zhang W, Wang D, Tan X (2019) Robust class-specific autoencoder for data cleaning and classification in the presence of label noise. Neural Process Lett 50(2):1845\u20131860. https:\/\/doi.org\/10.1007\/s11063-018-9963-9","journal-title":"Neural Process Lett"},{"key":"18598_CR31","unstructured":"Shu J, Xie Q, Yi L, Zhao Q, Zhou S, Xu Z, Meng D (2019) Meta-weight-net: learning an explicit mapping for sample weighting. Adv Neural Inform Process Syst 32"},{"key":"18598_CR32","first-page":"234","volume-title":"Medical image computing and computer-assisted intervention - MICCAI 2015","author":"O Ronneberger","year":"2015","unstructured":"Ronneberger O, Fischer P, Brox T (2015) U-net: convolutional networks for biomedical image segmentation. In: Navab N, Hornegger J, Wells WM, Frangi AF (eds) Medical image computing and computer-assisted intervention - MICCAI 2015. Springer, Cham, pp 234\u2013241"},{"key":"18598_CR33","doi-asserted-by":"crossref","unstructured":"Zhang N, Donahue J, Girshick R, Darrell T (2014) Part-based r-cnns for fine-grained category detection. In: Fleet D, Pajdla T, Schiele B, Tuytelaars T (eds) Computer Vision - ECCV 2014. Springer, Cham, pp 834\u2013849","DOI":"10.1007\/978-3-319-10590-1_54"},{"key":"18598_CR34","unstructured":"Wei X, Xie C, Wu J (2016) Mask-cnn: localizing parts and selecting descriptors for fine-grained image recognition. arXiv:1605.06878"},{"key":"18598_CR35","doi-asserted-by":"publisher","unstructured":"Lin D, Shen X, Lu C, Jia J (2015) Deep lac: deep localization, alignment and classification for fine-grained recognition. In: 2015 IEEE Conference on computer vision and pattern recognition (CVPR), pp 1666\u20131674. https:\/\/doi.org\/10.1109\/CVPR.2015.7298775","DOI":"10.1109\/CVPR.2015.7298775"},{"issue":"10","key":"18598_CR36","doi-asserted-by":"publisher","first-page":"14799","DOI":"10.1007\/s11042-022-13619-z","volume":"82","author":"X Nie","year":"2023","unstructured":"Nie X, Chai B, Wang L, Liao Q, Xu M (2023) Learning enhanced features and inferring twice for fine-grained image classification. Multim Tools Appl 82(10):14799\u201314813. https:\/\/doi.org\/10.1007\/s11042-022-13619-z","journal-title":"Multim Tools Appl"},{"key":"18598_CR37","doi-asserted-by":"publisher","unstructured":"Huang S, Xu Z, Tao D, Zhang Y (2016) Part-stacked cnn for fine-grained visual categorization. In: 2016 IEEE Conference on computer vision and pattern recognition (CVPR), pp 1173\u20131182. https:\/\/doi.org\/10.1109\/CVPR.2016.132","DOI":"10.1109\/CVPR.2016.132"},{"key":"18598_CR38","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1007\/978-3-030-58565-5_10","volume-title":"Computer Vision - ECCV 2020","author":"R Du","year":"2020","unstructured":"Du R, Chang D, Bhunia AK, Xie J, Ma Z, Song Y-Z, Guo J (2020) Fine-grained visual classification via progressive multi-granularity training of jigsaw patches. In: Vedaldi A, Bischof H, Brox T, Frahm J-M (eds) Computer Vision - ECCV 2020. Springer, Cham, pp 153\u2013168"},{"key":"18598_CR39","unstructured":"Wu Z, Chen Q, Liu Y, Zhang Y, Zhu C, Yu Y (2021) Progressive multi-stage interactive training in mobile network for fine-grained recognition. arXiv:2112.04223"},{"key":"18598_CR40","doi-asserted-by":"crossref","unstructured":"Yang L, Li X, Song R, Zhao B, Tao J, Zhou S, Liang J, Yang J (2022) Dynamic mlp for fine-grained image classification by leveraging geographical and temporal information. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 10945\u201310954","DOI":"10.1109\/CVPR52688.2022.01067"},{"key":"18598_CR41","doi-asserted-by":"crossref","unstructured":"Wang Q, Wang J, Quan X, Feng F, Xu Z, Nie S, Wang S, Khabsa M, Firooz H, Liu D (2023) Mustie: multimodal structural transformer for web information extraction. In: Proceedings of the 61st annual meeting of the association for computational linguistics (vol 1: Long Papers), pp 2405\u20132420","DOI":"10.18653\/v1\/2023.acl-long.135"},{"key":"18598_CR42","doi-asserted-by":"publisher","unstructured":"Wang Q, Fang Y, Ravula A, Feng F, Quan X, Liu D (2022) Webformer: the web-page transformer for structure information extraction. In: Proceedings of the ACM Web conference 2022. WWW \u201922, pp 3124\u20133133. Association for Computing Machinery, New York, USA. https:\/\/doi.org\/10.1145\/3485447.3512032","DOI":"10.1145\/3485447.3512032"},{"key":"18598_CR43","first-page":"9978","volume":"2023","author":"L Yang","year":"2023","unstructured":"Yang L, Wang Q, Wang J, Quan X, Feng F, Chen Y, Khabsa M, Wang S, Xu Z, Liu D (2023) Mixpave: mix-prompt tuning for few-shot product attribute value extraction. Findings of the association for computational linguistics: ACL 2023:9978\u20139991","journal-title":"Findings of the association for computational linguistics: ACL"},{"key":"18598_CR44","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1007\/978-3-319-46487-9_19","volume-title":"Computer Vision - ECCV 2016","author":"J Krause","year":"2016","unstructured":"Krause J, Sapp B, Howard A, Zhou H, Toshev A, Duerig T, Philbin J, Fei-Fei L (2016) The unreasonable effectiveness of noisy data for fine-grained recognition. In: Leibe B, Matas J, Sebe N, Welling M (eds) Computer Vision - ECCV 2016. Springer, Cham, pp 301\u2013320"},{"key":"18598_CR45","unstructured":"Han B, Yao Q, Yu X, Niu G, Xu M, Hu W, Tsang IW, Sugiyama M (2018) Co-teaching: robust training of deep neural networks with extremely noisy labels. In: Bengio S, Wallach HM, Larochelle H, Grauman K, Cesa-Bianchi N, Garnett R (eds) Advances in neural information processing systems 31: annual conference on neural information processing systems 2018, NeurIPS 2018, December 3-8, 2018, Montr\u00e9al, Canada, pp 8536\u20138546. https:\/\/proceedings.neurips.cc\/paper\/2018\/hash\/a19744e268754fb0148b01764 7355b7b-Abstract.html"},{"key":"18598_CR46","unstructured":"Yu X, Han B, Yao J, Niu G, Tsang I, Sugiyama M (2019) How does disagreement help generalization against label corruption? In: International conference on machine learning, pp 7164\u20137173. PMLR"},{"key":"18598_CR47","doi-asserted-by":"publisher","unstructured":"Liu D, Cui Y, Yan L, Mousas C, Yang B, Chen Y (2022) Densernet: weakly supervised visual localization using multi-scale feature aggregation. Proceedings of the AAAI conference on artificial intelligence 6101\u20136109. https:\/\/doi.org\/10.1609\/aaai.v35i7.16760","DOI":"10.1609\/aaai.v35i7.16760"},{"key":"18598_CR48","doi-asserted-by":"publisher","first-page":"2678","DOI":"10.1109\/TIP.2023.3272826","volume":"32","author":"D Liu","year":"2023","unstructured":"Liu D, Liang J, Geng T, Loui A, Zhou T (2023) Tripartite feature enhanced pyramid network for dense prediction. IEEE Trans Image Process 32:2678\u20132692. https:\/\/doi.org\/10.1109\/TIP.2023.3272826","journal-title":"IEEE Trans Image Process"},{"key":"18598_CR49","doi-asserted-by":"publisher","unstructured":"Liu D, Cui Y, Tan W, Chen Y (2021) Sg-net: spatial granularity network for one-stage video instance segmentation. In: 2021 IEEE\/CVF conference on computer vision and pattern recognition (CVPR). https:\/\/doi.org\/10.1109\/cvpr46437.2021.00969","DOI":"10.1109\/cvpr46437.2021.00969"},{"key":"18598_CR50","volume-title":"Tf-blender: temporal feature blender for video object detection","author":"Y Cui","year":"2021","unstructured":"Cui Y, Yan L, Cao Z, Liu D (2021) Tf-blender: temporal feature blender for video object detection. Cornell University - arXiv, Cornell University - arXiv"},{"key":"18598_CR51","unstructured":"Wang W, Liang J, Liu D (2022) Learning equivariant segmentation with instance-unique querying"},{"key":"18598_CR52","doi-asserted-by":"crossref","unstructured":"Shu J, Yuan X, Meng D, Xu Z (2022) Cmw-net: learning a class-aware sample weighting mapping for robust deep learning. CoRR arXiv:2202.05613","DOI":"10.1109\/TPAMI.2023.3271451"},{"key":"18598_CR53","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) SMOTE: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357. https:\/\/doi.org\/10.1613\/jair.953","journal-title":"J Artif Intell Res"},{"key":"18598_CR54","doi-asserted-by":"crossref","unstructured":"Dong Q, Gong S, Zhu X (2017) Class rectification hard mining for imbalanced deep learning. In: Proceedings of the IEEE International conference on computer vision, pp 1851\u20131860","DOI":"10.1109\/ICCV.2017.205"},{"key":"18598_CR55","doi-asserted-by":"crossref","unstructured":"Zadrozny B (2004) Learning and evaluating classifiers under sample selection bias. In: Proceedings of the twenty-first international conference on machine learning, p 114","DOI":"10.1145\/1015330.1015425"},{"key":"18598_CR56","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"18598_CR57","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.121979","volume":"238","author":"C Yue","year":"2024","unstructured":"Yue C, Huang R, Towey D, Xian Z, Wu G (2024) An entropy-based group decision-making approach for software quality evaluation. Expert Syst Appl 238:121979. https:\/\/doi.org\/10.1016\/j.eswa.2023.121979","journal-title":"Expert Syst Appl"},{"key":"18598_CR58","doi-asserted-by":"crossref","unstructured":"Dubey A, Gupta O, Guo P, Raskar R, Farrell R, Naik N (2018) Pairwise confusion for fine-grained visual classification. In: Proceedings of the European conference on computer vision (ECCV), pp 70\u201386","DOI":"10.1007\/978-3-030-01258-8_5"},{"key":"18598_CR59","doi-asserted-by":"crossref","unstructured":"Yang Z, Luo T, Wang D, Hu Z, Gao J, Wang L (2018) Learning to navigate for fine-grained classification. In: Proceedings of the European conference on computer vision (ECCV), pp 420\u2013435","DOI":"10.1007\/978-3-030-01264-9_26"},{"key":"18598_CR60","doi-asserted-by":"publisher","unstructured":"Wang Y, Morariu VI, Davis LS (2018) Learning a discriminative filter bank within a cnn for fine-grained recognition. In: 2018 IEEE\/CVF Conference on computer vision and pattern recognition, pp 4148\u20134157. https:\/\/doi.org\/10.1109\/CVPR.2018.00436","DOI":"10.1109\/CVPR.2018.00436"},{"key":"18598_CR61","doi-asserted-by":"publisher","first-page":"7006","DOI":"10.1109\/TIP.2020.2996736","volume":"29","author":"K Song","year":"2020","unstructured":"Song K, Wei X, Shu X, Song R, Lu J (2020) Bi-modal progressive mask attention for fine-grained recognition. IEEE Trans Image Process 29:7006\u20137018. https:\/\/doi.org\/10.1109\/TIP.2020.2996736","journal-title":"IEEE Trans Image Process"},{"key":"18598_CR62","doi-asserted-by":"publisher","unstructured":"Li J, Zhu L, Huang Z, Lu K, Zhao J (2018) I read, i saw, i tell: texts assisted fine-grained visual classification. In: Proceedings of the 26th ACM international conference on multimedia. MM \u201918, pp 663\u2013671. Association for Computing Machinery, New York, USA. https:\/\/doi.org\/10.1145\/3240508.3240579","DOI":"10.1145\/3240508.3240579"},{"key":"18598_CR63","doi-asserted-by":"publisher","unstructured":"Wang Y, Choi J, Morariu VI, Davis LS (2016) Mining discriminative triplets of patches for fine-grained classification. In: 2016 IEEE Conference on computer vision and pattern recognition (CVPR), pp 1163\u20131172. https:\/\/doi.org\/10.1109\/CVPR.2016.131","DOI":"10.1109\/CVPR.2016.131"},{"key":"18598_CR64","doi-asserted-by":"publisher","first-page":"704","DOI":"10.1016\/j.patcog.2017.10.002","volume":"76","author":"X Wei","year":"2018","unstructured":"Wei X, Xie C, Wu J, Shen C (2018) Mask-cnn: localizing parts and selecting descriptors for fine-grained bird species categorization. Pattern Recognit 76:704\u2013714. https:\/\/doi.org\/10.1016\/j.patcog.2017.10.002","journal-title":"Pattern Recognit"},{"key":"18598_CR65","doi-asserted-by":"crossref","unstructured":"Zhang C, Lin G, Wang Q, Shen F, Yao Y, Tang Z (2022) Guided by meta-set: a data-driven method for fine-grained visual recognition. IEEE Transactions on Multimedia","DOI":"10.1109\/TMM.2022.3181439"},{"issue":"5","key":"18598_CR66","doi-asserted-by":"publisher","first-page":"749","DOI":"10.1109\/LGRS.2018.2802944","volume":"15","author":"Z Zhang","year":"2018","unstructured":"Zhang Z, Liu Q, Wang Y (2018) Road extraction by deep residual u-net. IEEE Geosci Remote Sensing Lett 15(5):749\u2013753","journal-title":"IEEE Geosci Remote Sensing Lett"},{"key":"18598_CR67","doi-asserted-by":"publisher","first-page":"179656","DOI":"10.1109\/ACCESS.2020.3025372","volume":"8","author":"T Fan","year":"2020","unstructured":"Fan T, Wang G, Li Y, Wang H (2020) Ma-net: a multi-scale attention network for liver and tumor segmentation. IEEE Access 8:179656\u2013179665","journal-title":"IEEE Access"},{"key":"18598_CR68","doi-asserted-by":"crossref","unstructured":"Chaurasia A, Culurciello E (2017) Linknet: exploiting encoder representations for efficient semantic segmentation. In: 2017 IEEE Visual communications and image processing (VCIP), pp 1\u20134. IEEE","DOI":"10.1109\/VCIP.2017.8305148"},{"key":"18598_CR69","unstructured":"Kirillov A, He K, Girshick R, Doll\u00e1r P (2017) A unified architecture for instance and semantic segmentation. In: CVPR"},{"key":"18598_CR70","unstructured":"Li H, Xiong P, An J, Wang L (2018) Pyramid attention network for semantic segmentation. arXiv:1805.10180"},{"key":"18598_CR71","doi-asserted-by":"crossref","unstructured":"Chen L-C, Zhu Y, Papandreou G, Schroff F, Adam H (2018) Encoder-decoder with atrous separable convolution for semantic image segmentation. In: Proceedings of the European conference on computer vision (ECCV), pp 801\u2013818","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"18598_CR72","unstructured":"Wah C, Branson S, Welinder P, Perona P, Belongie S (2011) The caltech-ucsd birds-200-2011 dataset"},{"key":"18598_CR73","unstructured":"Maji S, Rahtu E, Kannala J, Blaschko MB, Vedaldi A (2013) Fine-grained visual classification of aircraft. arXiv:1306.5151"},{"key":"18598_CR74","unstructured":"Paszke A, Gross S, Chintala S, Chanan G, Yang E, DeVito Z, Lin Z, Desmaison A, Antiga L, Lerer A (2017) Automatic differentiation in pytorch"},{"issue":"3","key":"18598_CR75","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky O, Deng J, Su H, Krause J, Satheesh S, Ma S, Huang Z, Karpathy A, Khosla A, Bernstein MS, Berg AC, Fei-Fei L (2015) Imagenet large scale visual recognition challenge. Int J Comput Vis 115(3):211\u2013252. https:\/\/doi.org\/10.1007\/s11263-015-0816-y","journal-title":"Int J Comput Vis"},{"key":"18598_CR76","doi-asserted-by":"crossref","unstructured":"Zhang H, Cisse M, Dauphin YN, Lopez-Paz D (2017) mixup: beyond empirical risk minimization. arXiv:1710.09412","DOI":"10.1007\/978-1-4899-7687-1_79"},{"key":"18598_CR77","unstructured":"Krizhevsky A, Hinton G et\u00a0al (2009) Learning multiple layers of features from tiny images"},{"key":"18598_CR78","doi-asserted-by":"crossref","unstructured":"Patrini G, Rozza A, Krishna\u00a0Menon A, Nock R, Qu L (2017) Making deep neural networks robust to label noise: a loss correction approach. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1944\u20131952","DOI":"10.1109\/CVPR.2017.240"},{"key":"18598_CR79","unstructured":"Zhang Z, Sabuncu M (2018) Generalized cross entropy loss for training deep neural networks with noisy labels. Adv Neural Inform Process Syst 31"},{"key":"18598_CR80","unstructured":"Ren M, Zeng W, Yang B, Urtasun R (2018) Learning to reweight examples for robust deep learning. In: International conference on machine learning, pp 4334\u20134343. PMLR"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-18598-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-024-18598-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-18598-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,7]],"date-time":"2024-10-07T13:29:40Z","timestamp":1728307780000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-024-18598-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,2]]},"references-count":80,"journal-issue":{"issue":"33","published-online":{"date-parts":[[2024,10]]}},"alternative-id":["18598"],"URL":"https:\/\/doi.org\/10.1007\/s11042-024-18598-x","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,3,2]]},"assertion":[{"value":"26 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 January 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 February 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 March 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}}]}}