{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T03:40:05Z","timestamp":1776915605903,"version":"3.51.2"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2023,9,12]],"date-time":"2023-09-12T00:00:00Z","timestamp":1694476800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,9,12]],"date-time":"2023-09-12T00:00:00Z","timestamp":1694476800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62066035"],"award-info":[{"award-number":["62066035"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004763","name":"Natural Science Foundation of Inner Mongolia","doi-asserted-by":"publisher","award":["2022LHMS06004"],"award-info":[{"award-number":["2022LHMS06004"]}],"id":[{"id":"10.13039\/501100004763","id-type":"DOI","asserted-by":"publisher"}]},{"name":"the basic scientific research business fee project of the universities directly under the Inner Mongolia Autonomous Region","award":["JY20220089"],"award-info":[{"award-number":["JY20220089"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2024,6]]},"DOI":"10.1007\/s00371-023-03075-7","type":"journal-article","created":{"date-parts":[[2023,9,12]],"date-time":"2023-09-12T14:02:15Z","timestamp":1694527335000},"page":"4167-4181","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["IDA: an improved dual attention module for pollen classification"],"prefix":"10.1007","volume":"40","author":[{"given":"Gao","family":"Le","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1107-5679","authenticated-orcid":false,"given":"Shi","family":"Bao","sequence":"additional","affiliation":[]},{"given":"Dezhi","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Kaibo","family":"Duan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,9,12]]},"reference":[{"issue":"6","key":"3075_CR1","doi-asserted-by":"publisher","first-page":"567","DOI":"10.1111\/j.1398-9995.1998.tb03932.x","volume":"53","author":"G D\u2019amato","year":"1998","unstructured":"D\u2019amato, G., Spieksma, F.T.M., Liccardi, G., et al.: Pollen-related allergy in Europe. Allergy 53(6), 567\u2013578 (1998)","journal-title":"Allergy"},{"key":"3075_CR2","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S. et al.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (pp. 770-778) (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"6","key":"3075_CR3","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. Commun. ACM 60(6), 84\u201390 (2017)","journal-title":"Commun. ACM"},{"key":"3075_CR4","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"3075_CR5","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Dollar, P. et al.: Mask r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision (pp. 2961-2969) (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"3075_CR6","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2017","unstructured":"Ren, S., He, K., Girshick, R., et al.: Faster r-cnn: Towards realtime object detection with region proposal networks. IEEE Trans. Pattern Anal. Mach. Intell. 39, 1137\u20131149 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"3075_CR7","unstructured":"Vaswani, A., Shazeer, N., Parmar, N. et al.: Attention is all you need. Adv. Neural Inform. Process. Syst. 30 (2017)"},{"key":"3075_CR8","doi-asserted-by":"crossref","unstructured":"Huang, G., Liu, Z., Van Der Maaten, L. et al.: Densely connected convolutional networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (pp. 4700-4708) (2017)","DOI":"10.1109\/CVPR.2017.243"},{"issue":"6","key":"3075_CR9","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. Commun. ACM 60(6), 84\u201390 (2017)","journal-title":"Commun. ACM"},{"key":"3075_CR10","doi-asserted-by":"crossref","unstructured":"Chollet, F.: Xception: Deep learning with depthwise separable convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (pp. 1251-1258) (2017)","DOI":"10.1109\/CVPR.2017.195"},{"key":"3075_CR11","unstructured":"Howard, A.G., Zhu, M., Chen, B. et al.: Mobilenets: Efficient convolutional neural networks for mobile vision applications. arXiv preprint arXiv:1704.04861 (2017)"},{"key":"3075_CR12","doi-asserted-by":"crossref","unstructured":"Howard, A., Sandler, M., Chu, G. et al.: Searching for mobilenetv3. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (pp. 1314-1324) (2019)","DOI":"10.1109\/ICCV.2019.00140"},{"key":"3075_CR13","unstructured":"Tan, M., Le, Q.: Efficientnet: Rethinking model scaling for convolutional neural networks. In: International Conference on Machine Learning (pp. 6105-6114). PMLR (2019)"},{"key":"3075_CR14","unstructured":"Tan, M., Le, Q.: Efficientnetv2: Smaller models and faster training. In: International Conference on Machine Learning (pp. 10096-10106). PMLR (2021)"},{"key":"3075_CR15","doi-asserted-by":"crossref","unstructured":"Daood, A., Ribeiro, E., Bush, M.: Pollen grain recognition using deep learning. In: International Symposium on Visual Computing (pp. 321-330). Springer, Cham (2016)","DOI":"10.1007\/978-3-319-50835-1_30"},{"key":"3075_CR16","doi-asserted-by":"crossref","unstructured":"de Geus, A.R., Barcelos, C.A.Z., Batista, M.A. et al.: Large-scale pollen recognition with deep learning. In: 2019 27th European Signal Processing Conference (EUSIPCO) (pp. 1-5). IEEE (2019)","DOI":"10.23919\/EUSIPCO.2019.8902735"},{"issue":"9","key":"3075_CR17","doi-asserted-by":"publisher","first-page":"e0201807","DOI":"10.1371\/journal.pone.0201807","volume":"13","author":"V Sevillano","year":"2018","unstructured":"Sevillano, V., Aznarte, J.L.: Improving classification of pollen grain images of the POLEN23E dataset through three different applications of deep learning convolutional neural networks. PLoS ONE 13(9), e0201807 (2018)","journal-title":"PLoS ONE"},{"key":"3075_CR18","doi-asserted-by":"publisher","first-page":"148932","DOI":"10.1016\/j.scitotenv.2021.148932","volume":"796","author":"J Schaefer","year":"2021","unstructured":"Schaefer, J., Milling, M., Schuller, B.W., et al.: Towards automatic airborne pollen monitoring: from commercial devices to operational by mitigating class-imbalance in a deep learning approach. Sci. Total Environ. 796, 148932 (2021)","journal-title":"Sci. Total Environ."},{"key":"3075_CR19","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural machine translation by jointly learning to align and translate. arXiv preprint arXiv:1409.0473 (2014)"},{"key":"3075_CR20","unstructured":"Hassanin, M., Anwar, S., Radwan, I. et al.: Visual attention methods in deep learning: an in-depth survey. arXiv preprint arXiv:2204.07756 (2022)"},{"key":"3075_CR21","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., Sun, G.: Squeeze-and-excitation networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (pp. 7132-7141) (2018)","DOI":"10.1109\/CVPR.2018.00745"},{"key":"3075_CR22","doi-asserted-by":"crossref","unstructured":"Wang, Q., Wu, B., Zhu, P. et al.: ECA-Net: Efficient channel attention for deep convolutional neural networks. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE (2020)","DOI":"10.1109\/CVPR42600.2020.01155"},{"key":"3075_CR23","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.Y. et al.: Cbam: Convolutional block attention module. In: Proceedings of the European Conference on Computer Vision (ECCV) (pp. 3\u201319) (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"3075_CR24","doi-asserted-by":"crossref","unstructured":"Li, W., Zhu, X., Gong, S.: Harmonious attention network for person re-identification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (pp. 2285-2294) (2018)","DOI":"10.1109\/CVPR.2018.00243"},{"key":"3075_CR25","doi-asserted-by":"crossref","unstructured":"Ding, F., Yang, G., Wu, J., et al.: High-order attention networks for medical image segmentation. In: International Conference on Medical Image Computing and Computer-Assisted Intervention (pp. 253-262). Springer, Cham (2020)","DOI":"10.1007\/978-3-030-59710-8_25"},{"key":"3075_CR26","doi-asserted-by":"crossref","unstructured":"Zhao, T., Wu, X.: Pyramid feature attention network for saliency detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (pp. 3085-3094) (2019)","DOI":"10.1109\/CVPR.2019.00320"},{"key":"3075_CR27","doi-asserted-by":"crossref","unstructured":"Li, C., Du, D., Zhang, L. et al.: Spatial attention pyramid network for unsupervised domain adaptation. In: European Conference on Computer Vision (pp. 481-497). Springer, Cham (2020)","DOI":"10.1007\/978-3-030-58601-0_29"},{"key":"3075_CR28","doi-asserted-by":"crossref","unstructured":"Meng, Z., Ma, J., Yuan, X.: End-to-end low cost compressive spectral imaging with spatial-spectral self-attention. In: European Conference on Computer Vision (pp. 187-204). Springer, Cham (2020)","DOI":"10.1007\/978-3-030-58592-1_12"},{"key":"3075_CR29","unstructured":"Park, J., Woo, S., Lee, J.Y. et al.: Bam: Bottleneck attention module. arXiv preprint arXiv:1807.06514 (2018)"},{"key":"3075_CR30","doi-asserted-by":"crossref","unstructured":"Liu, H., Liu, F., Fan, X. et al.: Polarized self-attention: towards high-quality pixel-wise regression. arXiv preprint arXiv:2107.00782 (2021)","DOI":"10.1016\/j.neucom.2022.07.054"},{"key":"3075_CR31","doi-asserted-by":"crossref","unstructured":"Chen, M., Wang, P., Shang, D., Wang, P.: Cycle-attention-derain: unsupervised rain removal with CycleGAN. V. Comput. 1-13 (2023)","DOI":"10.1007\/s00371-023-02947-2"},{"issue":"9\u201310","key":"3075_CR32","doi-asserted-by":"publisher","first-page":"3163","DOI":"10.1007\/s00371-022-02535-w","volume":"38","author":"Z Ma","year":"2022","unstructured":"Ma, Z., Yuan, M., Gu, J., Meng, W., Xu, S., Zhang, X.: Triple-strip attention mechanism-based natural disaster images classification and segmentation. Vis. Comput. 38(9\u201310), 3163\u20133173 (2022)","journal-title":"Vis. Comput."},{"issue":"2","key":"3075_CR33","doi-asserted-by":"publisher","first-page":"1489","DOI":"10.1109\/TPAMI.2022.3164083","volume":"45","author":"Y Li","year":"2022","unstructured":"Li, Y., Yao, T., Pan, Y., et al.: Contextual transformer networks for visual recognition. IEEE Trans. Pattern Anal. Mach. Intell. 45(2), 1489 (2022)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"3075_CR34","unstructured":"Goyal, A., Bochkovskiy, A., Deng, J. et al.: Non-deep networks. arXiv preprint arXiv:2110.07641 (2021)"},{"key":"3075_CR35","doi-asserted-by":"crossref","unstructured":"Cao, Y., Xu, J., Lin, S. et al.: Gcnet: Non-local networks meet squeeze-excitation networks and beyond. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision Workshops (pp. 0-0) (2019)","DOI":"10.1109\/ICCVW.2019.00246"},{"key":"3075_CR36","doi-asserted-by":"crossref","unstructured":"Zhang, Q.L., Yang, Y.B.: Sa-net: Shuffle attention for deep convolutional neural networks. In: ICASSP 2021-2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) (pp. 2235-2239). IEEE (2021)","DOI":"10.1109\/ICASSP39728.2021.9414568"},{"key":"3075_CR37","doi-asserted-by":"crossref","unstructured":"Yu, T., Li, X., Cai, Y. et al.: S $$^ 2$$-MLPv2: Improved spatial-shift MLP architecture for vision. arXiv preprint arXiv:2108.01072 (2021)","DOI":"10.1109\/WACV51458.2022.00367"},{"key":"3075_CR38","first-page":"3965","volume":"34","author":"Z Dai","year":"2021","unstructured":"Dai, Z., Liu, H., Le, Q.V., et al.: Coatnet: marrying convolution and attention for all data sizes. Adv. Neural. Inf. Process. Syst. 34, 3965\u20133977 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"3075_CR39","unstructured":"Wang, W., Yao, L., Chen, L. et al.: Crossformer: A versatile vision transformer hinging on cross-scale attention. arXiv preprint arXiv:2108.00154 (2021)"},{"key":"3075_CR40","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"key":"3075_CR41","doi-asserted-by":"crossref","unstructured":"Radosavovic, I., Kosaraju, R.P., Girshick, R. et al.: Designing network design spaces. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (pp. 10428-10436) (2020)","DOI":"10.1109\/CVPR42600.2020.01044"},{"key":"3075_CR42","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A. et al.: An image is worth 16x16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"3075_CR43","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y. et al.: Swin transformer: Hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (pp. 10012-10022) (2021)","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"3075_CR44","doi-asserted-by":"crossref","unstructured":"Wu, H., Xiao, B., Codella, N. et al.: Cvt: Introducing convolutions to vision transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (pp. 22\u201331) (2021)","DOI":"10.1109\/ICCV48922.2021.00009"},{"key":"3075_CR45","doi-asserted-by":"crossref","unstructured":"Selvaraju, R.R., Cogswell, M., Das, A. et al.: Grad-cam: Visual explanations from deep networks via gradient-based localization. In: Proceedings of the IEEE International Conference on Computer Vision (pp. 618-626) (2017)","DOI":"10.1109\/ICCV.2017.74"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03075-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-023-03075-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03075-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,6]],"date-time":"2024-06-06T11:08:02Z","timestamp":1717672082000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-023-03075-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,9,12]]},"references-count":45,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2024,6]]}},"alternative-id":["3075"],"URL":"https:\/\/doi.org\/10.1007\/s00371-023-03075-7","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,9,12]]},"assertion":[{"value":"21 August 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 September 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}