{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,21]],"date-time":"2026-03-21T21:45:55Z","timestamp":1774129555824,"version":"3.50.1"},"publisher-location":"Singapore","reference-count":45,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819620531","type":"print"},{"value":"9789819620548","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-2054-8_27","type":"book-chapter","created":{"date-parts":[[2025,1,2]],"date-time":"2025-01-02T15:47:25Z","timestamp":1735832845000},"page":"362-372","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Enhancing Environmental Monitoring Through Multispectral Imaging: The WasteMS Dataset for Semantic Segmentation of Lakeside Waste"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-4847-3555","authenticated-orcid":false,"given":"Qinfeng","family":"Zhu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-9318-823X","authenticated-orcid":false,"given":"Ningxin","family":"Weng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5538-4684","authenticated-orcid":false,"given":"Lei","family":"Fan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7005-5870","authenticated-orcid":false,"given":"Yuanzhi","family":"Cai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,1,3]]},"reference":[{"key":"27_CR1","doi-asserted-by":"publisher","first-page":"2673","DOI":"10.3390\/rs14112673","volume":"14","author":"Y Cai","year":"2022","unstructured":"Cai, Y., Fan, L., Zhang, C.: Semantic segmentation of multispectral images via linear compression of bands: an experiment using RIT-18. Remote Sens. 14, 2673 (2022)","journal-title":"Remote Sens."},{"key":"27_CR2","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1016\/j.isprsjprs.2018.04.014","volume":"145","author":"R Kemker","year":"2018","unstructured":"Kemker, R., Salvaggio, C., Kanan, C.: Algorithms for semantic segmentation of multispectral remote sensing imagery using deep learning. ISPRS J. Photogramm. Remote Sens. 145, 60\u201377 (2018)","journal-title":"ISPRS J. Photogramm. Remote Sens."},{"key":"27_CR3","doi-asserted-by":"publisher","first-page":"7589","DOI":"10.1109\/JSTARS.2022.3203145","volume":"15","author":"I Ulku","year":"2022","unstructured":"Ulku, I., Akag\u00fcnd\u00fcz, E., Ghamisi, P.: Deep semantic segmentation of trees using multispectral images. IEEE J. Sel. Top. Appl. Earth Obs. Remote Sens. 15, 7589\u20137604 (2022)","journal-title":"IEEE J. Sel. Top. Appl. Earth Obs. Remote Sens."},{"key":"27_CR4","doi-asserted-by":"publisher","first-page":"1215","DOI":"10.3390\/su15021215","volume":"15","author":"Z Wang","year":"2023","unstructured":"Wang, Z., Wang, C., Liu, Y., Wang, J., Qiu, Y.: Real-time identification of cyanobacteria blooms in lakeshore zone using camera and semantic segmentation: a case study of Lake Chaohu (Eastern China). Sustainability 15, 1215 (2023)","journal-title":"Sustainability"},{"key":"27_CR5","doi-asserted-by":"publisher","first-page":"965","DOI":"10.3390\/rs13050965","volume":"13","author":"M Kraft","year":"2021","unstructured":"Kraft, M., Piechocki, M., Ptak, B., Walas, K.: Autonomous, onboard vision-based trash and litter detection in low altitude aerial images collected by an unmanned aerial vehicle. Remote Sens. 13, 965 (2021)","journal-title":"Remote Sens."},{"key":"27_CR6","volume":"35","author":"K Bansal","year":"2024","unstructured":"Bansal, K., Tripathi, A.K.: WasteNet: a novel multi-scale attention-based U-Net architecture for waste detection in UAV images. Remote Sens. Appl. Soc. Environ. 35, 101220 (2024)","journal-title":"Remote Sens. Appl. Soc. Environ."},{"key":"27_CR7","doi-asserted-by":"publisher","first-page":"722","DOI":"10.1109\/TGRS.2008.2010457","volume":"47","author":"JA Berni","year":"2009","unstructured":"Berni, J.A., Zarco-Tejada, P.J., Su\u00e1rez, L., Fereres, E.: Thermal and narrowband multispectral remote sensing for vegetation monitoring from an unmanned aerial vehicle. IEEE Trans. Geosci. Remote Sens. 47, 722\u2013738 (2009)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"27_CR8","doi-asserted-by":"crossref","unstructured":"Ebona, J.M.: Waste management study in the Lake Buhi periphery, Buhi, Camarines sur, Philippines (2019)","DOI":"10.2495\/WS190271"},{"key":"27_CR9","first-page":"3523","volume":"44","author":"S Minaee","year":"2021","unstructured":"Minaee, S., Boykov, Y., Porikli, F., Plaza, A., Kehtarnavaz, N., Terzopoulos, D.: Image segmentation using deep learning: a survey. IEEE Trans. Pattern Anal. Mach. Intell. 44, 3523\u20133542 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"27_CR10","doi-asserted-by":"publisher","first-page":"1243","DOI":"10.1049\/ipr2.12419","volume":"16","author":"R Wang","year":"2022","unstructured":"Wang, R., Lei, T., Cui, R., Zhang, B., Meng, H., Nandi, A.K.: Medical image segmentation using deep learning: a survey. IET Image Proc. 16, 1243\u20131267 (2022)","journal-title":"IET Image Proc."},{"key":"27_CR11","doi-asserted-by":"crossref","unstructured":"Zhu, Q., et al.: Samba: semantic segmentation of remotely sensed images with state space model. Heliyon (2024)","DOI":"10.1016\/j.heliyon.2024.e38495"},{"key":"27_CR12","doi-asserted-by":"crossref","unstructured":"Ma, X., Zhang, X., Ding, X., Pun, M.-O., Ma, S.: Frequency decomposition-driven unsupervised domain adaptation for remote sensing image semantic segmentation. arXiv preprint arXiv:2404.04531 (2024)","DOI":"10.36227\/techrxiv.23730678.v1"},{"key":"27_CR13","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1016\/j.inffus.2022.06.003","volume":"86","author":"Y Himeur","year":"2022","unstructured":"Himeur, Y., Rimal, B., Tiwary, A., Amira, A.: Using artificial intelligence and data fusion for environmental monitoring: a review and future perspectives. Inf. Fusion 86, 44\u201375 (2022)","journal-title":"Inf. Fusion"},{"key":"27_CR14","unstructured":"Dosovitskiy, A., et al.: An image is worth 16x16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"27_CR15","doi-asserted-by":"crossref","unstructured":"Ma, X., Zhang, X., Pun, M.-O., Liu, M.: A multilevel multimodal fusion transformer for remote sensing semantic segmentation. IEEE Transactions on Geoscience and Remote Sensing (2024)","DOI":"10.1109\/TGRS.2024.3373033"},{"key":"27_CR16","unstructured":"Gu, A., Dao, T.: Mamba: linear-time sequence modeling with selective state spaces. arXiv preprint arXiv:2312.00752 (2023)"},{"key":"27_CR17","unstructured":"Zhu, L., Liao, B., Zhang, Q., Wang, X., Liu, W., Wang, X.: Vision mamba: efficient visual representation learning with bidirectional state space model. arXiv preprint arXiv:2401.09417 (2024)"},{"key":"27_CR18","unstructured":"Liu, Y., et al.: Vmamba: Visual state space model. arXiv preprint arXiv:2401.10166 (2024)"},{"key":"27_CR19","unstructured":"Peng, B., et al.: RWKV: reinventing RNNs for the transformer era. arXiv preprint arXiv:2305.13048 (2023)"},{"key":"27_CR20","unstructured":"Duan, Y., et al.: Vision-RWKV: efficient and scalable visual perception with RWKV-like architectures. arXiv preprint arXiv:2403.02308 (2024)"},{"key":"27_CR21","unstructured":"Beck, M., et al.: xLSTM: extended long short-term memory. arXiv preprint arXiv:2405.04517 (2024)"},{"key":"27_CR22","unstructured":"Alkin, B., Beck, M., P\u00f6ppel, K., Hochreiter, S., Brandstetter, J.: Vision-LSTM: xLSTM as generic vision backbone. arXiv preprint arXiv:2406.04303 (2024)"},{"key":"27_CR23","doi-asserted-by":"crossref","unstructured":"Zhu, Q., Cai, Y., Fan, L.: Seg-LSTM: performance of xLSTM for semantic segmentation of remotely sensed images. arXiv preprint arXiv:2406.14086 (2024)","DOI":"10.1016\/j.heliyon.2024.e38495"},{"key":"27_CR24","doi-asserted-by":"crossref","unstructured":"Zhu, Q., Fang, Y., Cai, Y., Chen, C., Fan, L.: Rethinking scanning strategies with vision mamba in semantic segmentation of remote sensing imagery: an experimental study. IEEE J. Sel. Top. Appl. Earth Obs. Remote Sens. (2024)","DOI":"10.1109\/JSTARS.2024.3472296"},{"key":"27_CR25","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2019.111511","volume":"237","author":"L Zeng","year":"2020","unstructured":"Zeng, L., Wardlow, B.D., Xiang, D., Hu, S., Li, D.: A review of vegetation phenological metrics extraction using time-series, multispectral satellite data. Remote Sens. Environ. 237, 111511 (2020)","journal-title":"Remote Sens. Environ."},{"key":"27_CR26","doi-asserted-by":"crossref","unstructured":"Kirillov, A., et al.: Segment anything. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 4015\u20134026. (2023)","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"27_CR27","doi-asserted-by":"publisher","first-page":"302","DOI":"10.1016\/j.neucom.2019.11.118","volume":"406","author":"S Hao","year":"2020","unstructured":"Hao, S., Zhou, Y., Guo, Y.: A brief survey on semantic segmentation with deep learning. Neurocomputing 406, 302\u2013321 (2020)","journal-title":"Neurocomputing"},{"key":"27_CR28","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.-J., Li, K., Fei-Fei, L.: ImageNet: a large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 248\u2013255. IEEE (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"27_CR29","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. Adv. Neural inf. Process. Syst. 25 (2012)"},{"key":"27_CR30","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"27_CR31","doi-asserted-by":"crossref","unstructured":"Liu, Z., Mao, H., Wu, C.-Y., Feichtenhofer, C., Darrell, T., Xie, S.: A convnet for the 2020s. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 11976\u201311986. (2022)","DOI":"10.1109\/CVPR52688.2022.01167"},{"key":"27_CR32","doi-asserted-by":"crossref","unstructured":"Liu, Z., et al.: Swin transformer: hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 10012\u201310022 (2021)","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"27_CR33","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3431\u20133440 (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"27_CR34","doi-asserted-by":"crossref","unstructured":"Zhao, H., Shi, J., Qi, X., Wang, X., Jia, J.: Pyramid scene parsing network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2881\u20132890 (2017)","DOI":"10.1109\/CVPR.2017.660"},{"key":"27_CR35","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"L-C Chen","year":"2017","unstructured":"Chen, L.-C., Papandreou, G., Kokkinos, I., Murphy, K., Yuille, A.L.: DeepLab: semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected crfs. IEEE Trans. Pattern Anal. Mach. Intell. 40, 834\u2013848 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"27_CR36","doi-asserted-by":"crossref","unstructured":"Chen, L.-C., Zhu, Y., Papandreou, G., Schroff, F., Adam, H.: Encoder-decoder with atrous separable convolution for semantic image segmentation. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 801\u2013818 (2018)","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"27_CR37","doi-asserted-by":"crossref","unstructured":"Xiao, T., Liu, Y., Zhou, B., Jiang, Y., Sun, J.: Unified perceptual parsing for scene understanding. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 418\u2013434 (2018)","DOI":"10.1007\/978-3-030-01228-1_26"},{"key":"27_CR38","doi-asserted-by":"crossref","unstructured":"Zhu, Q., Fan, L., Weng, N.: Advancements in point cloud data augmentation for deep learning: a survey. Pattern Recogn. 153, 110532 (2024)","DOI":"10.1016\/j.patcog.2024.110532"},{"key":"27_CR39","doi-asserted-by":"publisher","first-page":"1745","DOI":"10.1109\/TIP.2022.3199107","volume":"32","author":"B Li","year":"2022","unstructured":"Li, B., et al.: Dense nested attention network for infrared small target detection. IEEE Trans. Image Process. 32, 1745\u20131758 (2022)","journal-title":"IEEE Trans. Image Process."},{"key":"27_CR40","first-page":"1","volume":"61","author":"D Wang","year":"2022","unstructured":"Wang, D., Zhang, J., Du, B., Xia, G.-S., Tao, D.: An empirical study of remote sensing pretraining. IEEE Trans. Geosci. Remote Sens. 61, 1\u201320 (2022)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"27_CR41","doi-asserted-by":"publisher","first-page":"1367","DOI":"10.3390\/rs13071367","volume":"13","author":"Y Cai","year":"2021","unstructured":"Cai, Y., Huang, H., Wang, K., Zhang, C., Fan, L., Guo, F.: Selecting optimal combination of data channels for semantic segmentation in city information modelling (CIM). Remote Sens. 13, 1367 (2021)","journal-title":"Remote Sens."},{"key":"27_CR42","unstructured":"Goodfellow, I., et al.: Generative adversarial nets. Adv. Neural Inf. Process. Syst. 27 (2014)"},{"key":"27_CR43","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"27_CR44","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-019-0197-0","volume":"6","author":"C Shorten","year":"2019","unstructured":"Shorten, C., Khoshgoftaar, T.M.: A survey on image data augmentation for deep learning. J. Big Data 6, 1\u201348 (2019)","journal-title":"J. Big Data"},{"key":"27_CR45","unstructured":"Zhu, Q., Cao, J., Cai, Y., Fan, L.: Evaluating the impact of point cloud colorization on semantic segmentation accuracy. arXiv preprint arXiv:2410.06725 (2024)"}],"container-title":["Lecture Notes in Computer Science","MultiMedia Modeling"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-2054-8_27","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,23]],"date-time":"2025-03-23T01:42:11Z","timestamp":1742694131000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-2054-8_27"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819620531","9789819620548"],"references-count":45,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-2054-8_27","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"3 January 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"MMM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Multimedia Modeling","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Nara","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Japan","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 January 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11 January 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"31","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"mmm2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/mmm2025.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}