{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,18]],"date-time":"2025-09-18T10:38:46Z","timestamp":1758191926626,"version":"3.44.0"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"31","license":[{"start":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T00:00:00Z","timestamp":1730160000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T00:00:00Z","timestamp":1730160000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100004663","name":"Ministry of Science and Technology, Taiwan","doi-asserted-by":"publisher","award":["MOST 111-2635-M-035 -001 -"],"award-info":[{"award-number":["MOST 111-2635-M-035 -001 -"]}],"id":[{"id":"10.13039\/501100004663","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-024-20359-9","type":"journal-article","created":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T07:03:36Z","timestamp":1730185416000},"page":"37671-37700","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Enhanced fish species classification using dynamic multilayer perceptron and transformer encoders with extra distribution data"],"prefix":"10.1007","volume":"84","author":[{"given":"Mei-Hsin","family":"Chen","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0007-6354-168X","authenticated-orcid":false,"given":"Ting-Hsuan","family":"Lai","sequence":"additional","affiliation":[]},{"given":"Yao-Chung","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Tien-Yin","family":"Chou","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,10,29]]},"reference":[{"key":"20359_CR1","doi-asserted-by":"crossref","unstructured":"Akata Z, Reed S, Walter D et al (2015) Evaluation of output embeddings for fine-grained image classification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","DOI":"10.1109\/CVPR.2015.7298911"},{"key":"20359_CR2","doi-asserted-by":"publisher","unstructured":"Behera A, Wharton Z, Hewage PRPG et al (2021) Context-aware attentional pooling (cap) for fine-grained visual classification. Proceedings of the AAAI Conference on Artificial Intelligence 35(2):929\u2013937. https:\/\/doi.org\/10.1609\/aaai.v35i2.16176. https:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/16176","DOI":"10.1609\/aaai.v35i2.16176"},{"key":"20359_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.worlddev.2020.105048","volume":"135","author":"J Bronnmann","year":"2020","unstructured":"Bronnmann J, Smith MD, Abbott J et al (2020) Integration of a local fish market in namibia with the global seafood trade: Implications for fish traders and sustainability. World Dev 135:105048. https:\/\/doi.org\/10.1016\/j.worlddev.2020.105048","journal-title":"World Dev"},{"key":"20359_CR4","doi-asserted-by":"publisher","first-page":"4683","DOI":"10.1109\/TIP.2020.2973812","volume":"29","author":"D Chang","year":"2020","unstructured":"Chang D, Ding Y, Xie J et al (2020) The devil is in the channels: Mutual-channel loss for fine-grained image classification. IEEE Trans Image Process 29:4683\u20134695","journal-title":"IEEE Trans Image Process"},{"key":"20359_CR5","unstructured":"Chen T, Li M, Li Y, et\u00a0al (2015) Mxnet: A flexible and efficient machine learning library for heterogeneous distributed systems. arXiv preprint arXiv:1512.01274"},{"key":"20359_CR6","doi-asserted-by":"crossref","unstructured":"Chu G, Potetz B, Wang W, et\u00a0al (2019) Geo-aware networks for fine-grained recognition. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision Workshops","DOI":"10.1109\/ICCVW.2019.00033"},{"issue":"2","key":"20359_CR7","doi-asserted-by":"publisher","first-page":"652","DOI":"10.1109\/TPAMI.2019.2938758","volume":"43","author":"SH Gao","year":"2019","unstructured":"Gao SH, Cheng MM, Zhao K et al (2019) Res2net: A new multi-scale backbone architecture. IEEE Trans Pattern Anal Mach Intell 43(2):652\u2013662","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"20359_CR8","doi-asserted-by":"crossref","unstructured":"Gao Y, Han X, Wang X, et\u00a0al (2020) Channel interaction networks for fine-grained image categorization. In: Proceedings of the AAAI conference on artificial intelligence, pp 10818\u201310825","DOI":"10.1609\/aaai.v34i07.6712"},{"key":"20359_CR9","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, et\u00a0al (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"20359_CR10","doi-asserted-by":"crossref","unstructured":"Huang G, Liu Z, Van Der\u00a0Maaten L, et\u00a0al (2017) Densely connected convolutional networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4700\u20134708","DOI":"10.1109\/CVPR.2017.243"},{"key":"20359_CR11","doi-asserted-by":"crossref","unstructured":"Huang S, Wang X, Tao D (2021) Snapmix: Semantically proportional mixing for augmenting fine-grained data. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp 1628\u20131636","DOI":"10.1609\/aaai.v35i2.16255"},{"key":"20359_CR12","doi-asserted-by":"crossref","unstructured":"Khalifa NEM, Taha MHN, Hassanien AE (2018) Aquarium family fish species identification system using deep neural networks. In: International Conference on Advanced Intelligent Systems and Informatics, Springer, pp 347\u2013356","DOI":"10.1007\/978-3-319-99010-1_32"},{"key":"20359_CR13","doi-asserted-by":"crossref","unstructured":"Kratzert F, Mader H (2018) Fish species classification in underwater video monitoring using convolutional neural networks. EarthArXiv","DOI":"10.31223\/OSF.IO\/DXWTZ"},{"key":"20359_CR14","doi-asserted-by":"publisher","first-page":"904","DOI":"10.1126\/science.aao5646","volume":"359","author":"D Kroodsma","year":"2018","unstructured":"Kroodsma D, Mayorga J, Hochberg T et al (2018) Tracking the global footprint of fisheries. Sci 359:904\u2013908. https:\/\/doi.org\/10.1126\/science.aao5646","journal-title":"Sci"},{"key":"20359_CR15","doi-asserted-by":"publisher","first-page":"374","DOI":"10.1016\/j.future.2018.10.009","volume":"92","author":"S Lakshmanaprabu","year":"2019","unstructured":"Lakshmanaprabu S, Mohanty SN, Shankar K et al (2019) Optimal deep learning model for classification of lung cancer on ct images. Futur Gener Comput Syst 92:374\u2013382","journal-title":"Futur Gener Comput Syst"},{"key":"20359_CR16","doi-asserted-by":"crossref","unstructured":"Li H, Zhang X, Tian Q, et\u00a0al (2020) Attribute mix: Semantic data augmentation for fine grained recognition. In: 2020 IEEE International Conference on Visual Communications and Image Processing (VCIP), IEEE, pp 243\u2013246","DOI":"10.1109\/VCIP49819.2020.9301763"},{"key":"20359_CR17","doi-asserted-by":"crossref","unstructured":"Li X, Wang W, Hu X, et\u00a0al (2019) Selective kernel networks. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 510\u2013519","DOI":"10.1109\/CVPR.2019.00060"},{"key":"20359_CR18","doi-asserted-by":"crossref","unstructured":"Mac\u00a0Aodha O, Cole E, Perona P (2019) Presence-only geographical priors for fine-grained image classification. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 9596\u20139606","DOI":"10.1109\/ICCV.2019.00969"},{"key":"20359_CR19","unstructured":"Mai G, Janowicz K, Yan B, et\u00a0al (2020) Multi-scale representation learning for spatial feature distributions using grid cells. arXiv preprint arXiv:2003.00824"},{"issue":"9","key":"20359_CR20","doi-asserted-by":"publisher","first-page":"6530","DOI":"10.1109\/TGRS.2019.2906883","volume":"57","author":"R Minetto","year":"2019","unstructured":"Minetto R, Segundo MP, Sarkar S (2019) Hydra: An ensemble of convolutional neural networks for geospatial land classification. IEEE Trans Geosci Remote Sens 57(9):6530\u20136541","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"20359_CR21","first-page":"82","volume":"3","author":"L Mingwang","year":"2017","unstructured":"Mingwang L (2017) Fish image recognition and separation based on convolutional neural network [j]. Image Multimed Technol 3:82\u201383","journal-title":"Image Multimed Technol"},{"key":"20359_CR22","doi-asserted-by":"crossref","unstructured":"Montalbo FJP, Hernandez AA (2019) Classification of fish species with augmented data using deep convolutional neural network. In: 2019 IEEE 9th International Conference on System Engineering and Technology (ICSET), IEEE, pp 396\u2013401","DOI":"10.1109\/ICSEngT.2019.8906433"},{"issue":"1","key":"20359_CR23","first-page":"222","volume":"35","author":"MH Mozaffari","year":"2016","unstructured":"Mozaffari MH, Abdy H, Zahiri SH (2016) Ipo: an inclined planes system optimization algorithm. Comput Inf 35(1):222\u2013240","journal-title":"Comput Inf"},{"key":"20359_CR24","doi-asserted-by":"publisher","DOI":"10.1093\/ICESJMS\/FSZ036","author":"W Probst","year":"2020","unstructured":"Probst W (2020) How emerging data technologies can increase trust and transparency in fisheries. ICES J Mar Sci. https:\/\/doi.org\/10.1093\/ICESJMS\/FSZ036","journal-title":"ICES J Mar Sci"},{"key":"20359_CR25","doi-asserted-by":"crossref","unstructured":"Rathi D, Jain S, Indu S (2017) Underwater fish species classification using convolutional neural network and deep learning. In: 2017 Ninth international conference on advances in pattern recognition (ICAPR), IEEE, pp 1\u20136","DOI":"10.1109\/ICAPR.2017.8593044"},{"key":"20359_CR26","doi-asserted-by":"crossref","unstructured":"Salem T, Workman S, Jacobs N (2020) Learning a dynamic map of visual appearance. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 12435\u201312444","DOI":"10.1109\/CVPR42600.2020.01245"},{"key":"20359_CR27","doi-asserted-by":"publisher","DOI":"10.1016\/j.ecoinf.2019.100977","volume":"53","author":"AA dos Santos","year":"2019","unstructured":"dos Santos AA, Gon\u00e7alves WN (2019) Improving pantanal fish species recognition through taxonomic ranks in convolutional neural networks. Eco Inform 53:100977","journal-title":"Eco Inform"},{"key":"20359_CR28","unstructured":"Shao KT (2007) Taiwan fish database. www web electronic publication. http:\/\/fishdb.sinica.edu.tw, (2023-7-30)"},{"key":"20359_CR29","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556"},{"key":"20359_CR30","doi-asserted-by":"crossref","unstructured":"Tang K, Paluri M, Fei-Fei L, et\u00a0al (2015) Improving image classification with location context. In: Proceedings of the IEEE international conference on computer vision, pp 1008\u20131016","DOI":"10.1109\/ICCV.2015.121"},{"key":"20359_CR31","doi-asserted-by":"publisher","DOI":"10.1002\/lary.31175","author":"X Tao","year":"2023","unstructured":"Tao X, Zhao X, Liu H et al (2023) Automatic recognition of concealed fish bones under laryngoscopy: A practical ai model based on yolo-v5. Laryngoscope. https:\/\/doi.org\/10.1002\/lary.31175","journal-title":"Laryngoscope"},{"key":"20359_CR32","doi-asserted-by":"crossref","unstructured":"Terry JCD, Roy HE, August TA (2020a) Thinking like a naturalist: Enhancing computer vision of citizen science images by harnessing contextual data. Methods in Ecology and Evolution 11(2):303\u2013315","DOI":"10.1111\/2041-210X.13335"},{"key":"20359_CR33","doi-asserted-by":"crossref","unstructured":"Terry JCD, Roy HE, August TA (2020b) Thinking like a naturalist: Enhancing computer vision of citizen science images by harnessing contextual data. Methods in Ecology and Evolution 11(2):303\u2013315","DOI":"10.1111\/2041-210X.13335"},{"key":"20359_CR34","doi-asserted-by":"publisher","unstructured":"Tomassini M (2010) Cellular evolutionary algorithms pp 167\u2013191. https:\/\/doi.org\/10.1007\/978-3-642-12203-3sps8","DOI":"10.1007\/978-3-642-12203-3sps8"},{"key":"20359_CR35","doi-asserted-by":"crossref","unstructured":"Touvron H, Sablayrolles A, Douze M, et\u00a0al (2021) Grafit: Learning fine-grained image representations with coarse labels. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 874\u2013884","DOI":"10.1109\/ICCV48922.2021.00091"},{"key":"20359_CR36","doi-asserted-by":"crossref","unstructured":"Van\u00a0Horn G, Mac\u00a0Aodha O, Song Y, et\u00a0al (2018) The inaturalist species classification and detection dataset. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 8769\u20138778","DOI":"10.1109\/CVPR.2018.00914"},{"key":"20359_CR37","doi-asserted-by":"crossref","unstructured":"Van\u00a0Horn G, Cole E, Beery S, et\u00a0al (2021) Benchmarking representation learning for natural world image collections. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 12884\u201312893","DOI":"10.1109\/CVPR46437.2021.01269"},{"key":"20359_CR38","unstructured":"Vaswani A, Shazeer N, Parmar N, et\u00a0al (2017) Attention is all you need. Advances in neural information processing systems 30"},{"issue":"1","key":"20359_CR39","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-018-2201-7","volume":"19","author":"HC Wittich","year":"2018","unstructured":"Wittich HC, Seeland M, W\u00e4ldchen J et al (2018) Recommending plant taxa for supporting on-site species identification. BMC Bioinforma 19(1):1\u201317","journal-title":"BMC Bioinforma"},{"key":"20359_CR40","doi-asserted-by":"crossref","unstructured":"Xiao T, Xu Y, Yang K, et\u00a0al (2015) The application of two-level attention models in deep convolutional neural network for fine-grained image classification. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 842\u2013850","DOI":"10.1109\/CVPR.2015.7298685"},{"key":"20359_CR41","doi-asserted-by":"crossref","unstructured":"Xie S, Girshick R, Doll\u00e1r P, et\u00a0al (2017) Aggregated residual transformations for deep neural networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1492\u20131500","DOI":"10.1109\/CVPR.2017.634"},{"key":"20359_CR42","doi-asserted-by":"crossref","unstructured":"Yang L, Li X, Song R, et\u00a0al (2022) Dynamic mlp for fine-grained image classification by leveraging geographical and temporal information. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 10945\u201310954","DOI":"10.1109\/CVPR52688.2022.01067"},{"key":"20359_CR43","unstructured":"Yang S, Chen B (2023a) Effective surrogate gradient learning with high-order information bottleneck for spike-based machine intelligence. IEEE transactions on neural networks and learning systems"},{"key":"20359_CR44","doi-asserted-by":"crossref","unstructured":"Yang S, Chen B (2023b) Snib: improving spike-based machine learning using nonlinear information bottleneck. IEEE Transactions on Systems, Man, and Cybernetics: Systems","DOI":"10.1109\/TSMC.2023.3300318"},{"key":"20359_CR45","doi-asserted-by":"crossref","unstructured":"Yang S, Wang H, Chen B (2023) Sibols: robust and energy-efficient learning for spike-based machine intelligence in information bottleneck framework. IEEE Transactions on Cognitive and Developmental Systems","DOI":"10.1109\/TCDS.2023.3329532"},{"key":"20359_CR46","doi-asserted-by":"crossref","unstructured":"Yang Z, Luo T, Wang D, et\u00a0al (2018) Learning to navigate for fine-grained classification. In: Proceedings of the European conference on computer vision (ECCV), pp 420\u2013435","DOI":"10.1007\/978-3-030-01264-9_26"},{"key":"20359_CR47","first-page":"17","volume":"13","author":"S Sadeghi-Ivrigh","year":"2015","unstructured":"Sadeghi-Ivrigh S, Yazdani D, Yazdani D et al (2015) Fish swarm search algorithm: A new algorithm for global optimization. Int J artif intell 13:17\u201345","journal-title":"Int J artif intell"},{"key":"20359_CR48","doi-asserted-by":"publisher","unstructured":"Yiu YF, Du J, Mahapatra R (2018) Evolutionary heuristic a* search: Heuristic function optimization via genetic algorithm. 2018 IEEE First International Conference on Artificial Intelligence and Knowledge Engineering (AIKE) pp 25\u201332. https:\/\/doi.org\/10.1109\/AIKE.2018.00012","DOI":"10.1109\/AIKE.2018.00012"},{"key":"20359_CR49","doi-asserted-by":"crossref","unstructured":"Zhang F, Li M, Zhai G, et\u00a0al (2021) Multi-branch and multi-scale attention learning for fine-grained visual categorization. In: MultiMedia Modeling: 27th International Conference, MMM 2021, Prague, Czech Republic, June 22\u201324, 2021, Proceedings, Part I 27, Springer, pp 136\u2013147","DOI":"10.1007\/978-3-030-67832-6_12"},{"key":"20359_CR50","doi-asserted-by":"crossref","unstructured":"Zhang N, Donahue J, Girshick R, et\u00a0al (2014) Part-based r-cnns for fine-grained category detection. In: Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part I 13, Springer, pp 834\u2013849","DOI":"10.1007\/978-3-319-10590-1_54"},{"key":"20359_CR51","unstructured":"Zheng H, Fu J, Zha ZJ, et\u00a0al (2019) Learning deep bilinear transformation for fine-grained image representation. Advances in Neural Information Processing Systems 32"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-20359-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-024-20359-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-20359-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T09:46:17Z","timestamp":1758102377000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-024-20359-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,29]]},"references-count":51,"journal-issue":{"issue":"31","published-online":{"date-parts":[[2025,9]]}},"alternative-id":["20359"],"URL":"https:\/\/doi.org\/10.1007\/s11042-024-20359-9","relation":{},"ISSN":["1573-7721"],"issn-type":[{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2024,10,29]]},"assertion":[{"value":"2 August 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 June 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 October 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 October 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no conflicts of interest to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of interest"}}]}}