{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,22]],"date-time":"2026-03-22T22:54:21Z","timestamp":1774220061144,"version":"3.50.1"},"reference-count":44,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2026,2,16]],"date-time":"2026-02-16T00:00:00Z","timestamp":1771200000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,16]],"date-time":"2026-02-16T00:00:00Z","timestamp":1771200000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"QUTJBZ Program","award":["No. 2025ZDZX17"],"award-info":[{"award-number":["No. 2025ZDZX17"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SIViP"],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1007\/s11760-026-05146-3","type":"journal-article","created":{"date-parts":[[2026,2,16]],"date-time":"2026-02-16T23:06:52Z","timestamp":1771283212000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["WTSNet: An accurate stereo matching network based on wavelet transform and superpixel segmentation"],"prefix":"10.1007","volume":"20","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-5856-8984","authenticated-orcid":false,"given":"Haiming","family":"Qu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9999-1542","authenticated-orcid":false,"given":"Yunhui","family":"Luo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guiling","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chongbao","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Minxuan","family":"He","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mingyu","family":"Shang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qianqian","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,16]]},"reference":[{"issue":"11","key":"5146_CR1","doi-asserted-by":"publisher","first-page":"2274","DOI":"10.1109\/TPAMI.2012.120","volume":"34","author":"R Achanta","year":"2012","unstructured":"Achanta, R., Shaji, A., Smith, K., Lucchi, A., Fua, P., S\u00fcsstrunk, S.: SLIC superpixels compared to state-of-the-art superpixel methods. IEEE Trans. Pattern Anal. Mach. Intell. 34(11), 2274\u20132282 (2012). https:\/\/doi.org\/10.1109\/TPAMI.2012.120","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"5146_CR2","doi-asserted-by":"publisher","unstructured":"Chang, J.R., Chen, Y.S.: Pyramid stereo matching network. In: Proc. IEEE Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 5410\u20135418. IEEE, Salt Lake City, UT, USA (2018). https:\/\/doi.org\/10.1109\/CVPR.2018.00567","DOI":"10.1109\/CVPR.2018.00567"},{"issue":"1","key":"5146_CR3","doi-asserted-by":"crossref","first-page":"567","DOI":"10.1038\/s41598-024-84405-0","volume":"15","author":"W Chen","year":"2025","unstructured":"Chen, W., Liu, Y., Zhang, S., Zhou, M., Li, X.: A cross-domain adaptation and transfer learning network for stereo matching (ct-net). Sci. Rep. 15(1), 567 (2025)","journal-title":"Sci. Rep."},{"key":"5146_CR4","unstructured":"Chen, Z., Zhang, Y., Li, W., Wang, B., Zhao, Y., Chen, C.: Motif channel opened in a white-box: Stereo matching via motif correlation graph. arXiv preprint arXiv:2411.12426 (2024)"},{"key":"5146_CR5","unstructured":"Cheng, J., Liao, W., Cai, Z., Liu, L., Xu, G., Wang, X., Wang, Y., Yuan, Z., Deng, Y., Zang, J., Shi, Y., Tang, J., Yang, X.: Monster++: Unified stereo matching, multi-view stereo, and real-time stereo with monodepth priors. arXiv preprint (2025). https:\/\/github.com\/Junda24\/MonSter-plusplus. Submitted on 15 July 2025"},{"key":"5146_CR6","doi-asserted-by":"crossref","unstructured":"Cheng, J., Liu, L., Xu, G., Wang, X., Zhang, Z., Deng, Y., Zang, J., Chen, Y., Cai, Z., Yang, X.: Monster: Marry monodepth to stereo unleashes power. arXiv preprint arXiv:2501.08643 (2025)","DOI":"10.1109\/CVPR52734.2025.00588"},{"key":"5146_CR7","unstructured":"Cheng, X., Wang, P., Guan, C., Yang, R.: Leastereo: Learned stereo matching in neural architecture search. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 7986\u20137995 (2020)"},{"issue":"1","key":"5146_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13640-021-00551-9","volume":"2021","author":"A Emlek","year":"2021","unstructured":"Emlek, A., Peker, M.: Refinement of matching costs for stereo disparities using recurrent neural networks. EURASIP Journal on Image and Video Processing 2021(1), 1\u201315 (2021)","journal-title":"EURASIP Journal on Image and Video Processing"},{"issue":"4","key":"5146_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3197517.3201386","volume":"37","author":"S Fujieda","year":"2018","unstructured":"Fujieda, S., Takayama, K., Hachisuka, T.: Wavelet convolutional neural networks for texture classification. ACM Transactions on Graphics 37(4), 1\u201311 (2018). https:\/\/doi.org\/10.1145\/3197517.3201386. (SIGGRAPH 2018 Technical Paper)","journal-title":"ACM Transactions on Graphics"},{"key":"5146_CR10","doi-asserted-by":"publisher","unstructured":"Geiger, A., Lenz, P., Urtasun, R.: Are we ready for autonomous driving? the KITTI vision benchmark suite. In: Proc. IEEE Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 3354\u20133361. IEEE, Providence, RI, USA (2012). https:\/\/doi.org\/10.1109\/CVPR.2012.6248074","DOI":"10.1109\/CVPR.2012.6248074"},{"key":"5146_CR11","doi-asserted-by":"publisher","unstructured":"Guan, T., Guo, J., Wang, C., Liu, Y.H.: Bridgedepth: Bridging monocular and stereo reasoning with latent alignment. arXiv preprint arXiv:2308.04611 (2025). https:\/\/doi.org\/10.48550\/arXiv.2508.04611. ICCV 2025 Highlight","DOI":"10.48550\/arXiv.2508.04611"},{"key":"5146_CR12","doi-asserted-by":"publisher","unstructured":"Guo, X., Yang, K., Yang, W., Wang, X., Li, H.: Group-wise correlation stereo network. In: Proc. IEEE\/CVF Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 3273\u20133282. IEEE, Long Beach, CA, USA (2019). https:\/\/doi.org\/10.1109\/CVPR.2019.00337","DOI":"10.1109\/CVPR.2019.00337"},{"key":"5146_CR13","doi-asserted-by":"crossref","unstructured":"Han, L., Liu, Z., Lian, S.: Tp3m: Transformer-based pseudo 3d image matching with reference image. arXiv preprint arXiv:2405.08434 (2024)","DOI":"10.1109\/ICRA57147.2024.10610556"},{"key":"5146_CR14","doi-asserted-by":"publisher","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 770\u2013778. Las Vegas, NV, USA (2016). https:\/\/doi.org\/10.1109\/CVPR.2016.90. https:\/\/openaccess.thecvf.com\/content_cvpr_2016\/html\/He_Deep_Residual_Learning_CVPR_2016_paper.html","DOI":"10.1109\/CVPR.2016.90"},{"issue":"2","key":"5146_CR15","doi-asserted-by":"publisher","first-page":"328","DOI":"10.1109\/TPAMI.2007.1166","volume":"30","author":"H Hirschm\u00fcller","year":"2008","unstructured":"Hirschm\u00fcller, H.: Stereo processing by semiglobal matching and mutual information. IEEE Trans. Pattern Anal. Mach. Intell. 30(2), 328\u2013341 (2008). https:\/\/doi.org\/10.1109\/TPAMI.2007.1166","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"5146_CR16","doi-asserted-by":"crossref","unstructured":"Jiang, H., Lou, Z., Ding, L., Xu, R., Tan, M., Jiang, W., Huang, R.: Defom-stereo: Depth foundation model based stereo matching. arXiv preprint arXiv:2501.00026 (2024)","DOI":"10.1109\/CVPR52734.2025.02036"},{"key":"5146_CR17","doi-asserted-by":"crossref","unstructured":"Karpur, A., Perrotta, G., Martin-Brualla, R., Zhou, H., Araujo, A.: Lfm-3d: Learnable feature matching across wide baselines using 3d signals. arXiv preprint arXiv:2303.12779 (2023)","DOI":"10.1109\/3DV62453.2024.00079"},{"key":"5146_CR18","doi-asserted-by":"crossref","unstructured":"Kendall, A., Martirosyan, H., Dasgupta, S., Henry, P., Kennedy, R., Bachrach, A., Bry, A.: End-to-end learning of geometry and context for deep stereo regression. In: Proc. IEEE Int. Conf. Comput. Vis. (ICCV), pp. 66\u201375. IEEE, Venice, Italy (2017)","DOI":"10.1109\/ICCV.2017.17"},{"key":"5146_CR19","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"issue":"1","key":"5146_CR20","doi-asserted-by":"crossref","first-page":"7890","DOI":"10.1038\/s41598-024-56452-0","volume":"14","author":"J Li","year":"2024","unstructured":"Li, J., Wang, K., Sun, H., Zhao, Q.: Superpixel-edge-aware stereo matching (edgestereo). Sci. Rep. 14(1), 7890 (2024)","journal-title":"Sci. Rep."},{"key":"5146_CR21","doi-asserted-by":"crossref","unstructured":"Li, J., Wang, P., Xiong, P., Cai, T., Yan, Z., Yang, L., Liu, J., Fan, H., Liu, S.: Practical stereo matching via cascaded recurrent network with adaptive correlation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16263\u201316272 (2022)","DOI":"10.1109\/CVPR52688.2022.01578"},{"issue":"2","key":"5146_CR22","doi-asserted-by":"publisher","first-page":"336","DOI":"10.1007\/s11390-024-3414-z","volume":"39","author":"Z Li","year":"2024","unstructured":"Li, Z., Chen, X., Guo, S., Wang, S., Pun, C.: Wavenhancer: Unifying wavelet and transformer for image enhancement. J. Comput. Sci. Technol. 39(2), 336\u2013345 (2024). https:\/\/doi.org\/10.1007\/s11390-024-3414-z","journal-title":"J. Comput. Sci. Technol."},{"key":"5146_CR23","doi-asserted-by":"publisher","unstructured":"Li, Z., Liu, X., Drenkow, N., Garg, R., Reid, I., Le, H.: Revisiting stereo depth estimation from a sequence-to-sequence perspective with transformers. In: Proc. IEEE Int. Conf. Comput. Vis. (ICCV), pp. 6197\u20136206. IEEE, Montreal, Canada (2021). https:\/\/doi.org\/10.1109\/ICCV48922.2021.00616","DOI":"10.1109\/ICCV48922.2021.00616"},{"key":"5146_CR24","doi-asserted-by":"publisher","unstructured":"Lin, T.Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection. In: Proc. IEEE Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 2117\u20132125. IEEE, Honolulu, HI, USA (2017). https:\/\/doi.org\/10.1109\/CVPR.2017.106","DOI":"10.1109\/CVPR.2017.106"},{"key":"5146_CR25","doi-asserted-by":"crossref","unstructured":"Lipson, L., Teed, Z., Deng, J.: Raft-stereo: Multilevel recurrent field transforms for stereo matching. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 6186\u20136195 (2021)","DOI":"10.1109\/3DV53792.2021.00032"},{"key":"5146_CR26","doi-asserted-by":"publisher","unstructured":"Liu, P., Zhang, H., Lian, W., Zuo, W.: Multi-level wavelet-cnn for image restoration. IEEE Access 7, 74973\u201374985 (2019). https:\/\/doi.org\/10.1109\/ACCESS.2019.2921451. https:\/\/ieeexplore.ieee.org\/document\/8739239. Early arXiv version: arXiv:1907.03128","DOI":"10.1109\/ACCESS.2019.2921451"},{"key":"5146_CR27","doi-asserted-by":"publisher","unstructured":"Menze, M., Geiger, A.: Object scene flow for autonomous vehicles. In: Proc. IEEE Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 3061\u20133070. IEEE, Boston, MA, USA (2015). https:\/\/doi.org\/10.1109\/CVPR.2015.7299025","DOI":"10.1109\/CVPR.2015.7299025"},{"key":"5146_CR28","doi-asserted-by":"crossref","unstructured":"Shamsafar, F., Woerz, S., Rahim, R., Zell, A.: Mobilestereonet: Towards lightweight deep networks for stereo matching. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision (WACV), pp. 2417\u20132426 (2022)","DOI":"10.1109\/WACV51458.2022.00075"},{"key":"5146_CR29","doi-asserted-by":"publisher","unstructured":"Shen, Z., Dai, Y., Rao, Z.: CFNet: Cascade and fused cost volume for robust stereo matching. In: Proc. IEEE\/CVF Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 13906\u201313915. IEEE, Virtual Event (2021). https:\/\/doi.org\/10.1109\/CVPR46437.2021.01350","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"5146_CR30","doi-asserted-by":"crossref","unstructured":"Tankovich, V., H\u00e4ne, C., Fanello, S., Bouaziz, S., Rhemann, C., Kowdle, A., Izadi, S.: Hitnet: Hierarchical iterative tile refinement network for real-time stereo matching. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 14362\u201314372 (2021)","DOI":"10.1109\/CVPR46437.2021.01413"},{"issue":"1","key":"5146_CR31","doi-asserted-by":"publisher","first-page":"1234","DOI":"10.1038\/s41598-018-19450-7","volume":"14","author":"Y Wang","year":"2024","unstructured":"Wang, Y., Zhang, H., Li, C., Liu, Y., Zhao, Y.: An efficient and accurate multi-level cascaded recurrent network for stereo matching. Sci. Rep. 14(1), 1234 (2024)","journal-title":"Sci. Rep."},{"key":"5146_CR32","unstructured":"Wei, X., Liu, J., Yang, D., Cheng, J., Shu, C., Wang, W.: A wavelet-based stereo matching framework for solving frequency convergence inconsistency. arXiv preprint (2024). https:\/\/github.com\/SIA-IDE\/Wavelet-Stereo. CVPR 2024"},{"key":"5146_CR33","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.Y., Kweon, I.S.: Cbam: Convolutional block attention module. In: Proceedings of the European conference on computer vision (ECCV), pp. 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"5146_CR34","doi-asserted-by":"publisher","unstructured":"Wu, Z., Wu, X., Zhang, X., Wang, S., Ju, L.: Semantic stereo matching with pyramid cost volumes. In: Proc. IEEE\/CVF Int. Conf. Comput. Vis. (ICCV), pp. 7484\u20137493. IEEE, Seoul, Korea (2019). https:\/\/doi.org\/10.1109\/ICCV.2019.00759","DOI":"10.1109\/ICCV.2019.00759"},{"key":"5146_CR35","doi-asserted-by":"crossref","unstructured":"Xie, S., Tu, Z.: Holistically-nested edge detection. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV) (2015)","DOI":"10.1109\/ICCV.2015.164"},{"key":"5146_CR36","doi-asserted-by":"publisher","unstructured":"Xu, G., Cheng, J., Guo, P., Yang, X.: Attention concatenation volume for accurate and efficient stereo matching. In: Proc. IEEE\/CVF Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 12981\u201312990. IEEE, New Orleans, LA, USA (2022). https:\/\/doi.org\/10.1109\/CVPR52688.2022.01264","DOI":"10.1109\/CVPR52688.2022.01264"},{"key":"5146_CR37","doi-asserted-by":"crossref","unstructured":"Xu, G., Wang, X., Ding, X., Yang, X.: Iterative geometry encoding volume for stereo matching. In: arXiv preprint arXiv:2303.06615 (2023)","DOI":"10.1109\/CVPR52729.2023.02099"},{"key":"5146_CR38","doi-asserted-by":"publisher","unstructured":"Yang, G., Zhao, H., Shi, J., Deng, Z., Jia, J.: SegStereo: Exploiting semantic information for disparity estimation. In: Proc. Eur. Conf. Comput. Vis. (ECCV), pp. 636\u2013651. Springer, Munich, Germany (2018). https:\/\/doi.org\/10.1007\/978-3-030-01249-6_39","DOI":"10.1007\/978-3-030-01249-6_39"},{"key":"5146_CR39","doi-asserted-by":"publisher","unstructured":"Yang, X., Li, H., Qin, J., Yang, Y.: Learning wavelet coefficients for disparity estimation. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 12907\u201312916 (2020).https:\/\/doi.org\/10.1109\/CVPR42600.2020.01292. https:\/\/openaccess.thecvf.com\/content_CVPR_2020\/papers\/Yang_Learning_Wavelet_Coefficients_for_Disparity_Estimation_CVPR_2020_paper.pdf","DOI":"10.1109\/CVPR42600.2020.01292"},{"issue":"1","key":"5146_CR40","first-page":"2287","volume":"17","author":"J Zbontar","year":"2016","unstructured":"Zbontar, J., LeCun, Y.: Stereo matching by training a convolutional neural network to compare image patches. J. Mach. Learn. Res. 17(1), 2287\u20132318 (2016)","journal-title":"J. Mach. Learn. Res."},{"key":"5146_CR41","doi-asserted-by":"publisher","unstructured":"Zhang, F., Prisacariu, V., Yang, R., Torr, P.H.S.: GA-Net: Guided aggregation net for end-to-end stereo matching. In: Proc. IEEE Conf. Comput. Vis. Pattern Recognit. (CVPR), pp. 185\u2013194. IEEE, Long Beach, CA, USA (2019). https:\/\/doi.org\/10.1109\/CVPR.2019.00027","DOI":"10.1109\/CVPR.2019.00027"},{"key":"5146_CR42","unstructured":"Zhang, L., Wang, W., Chen, H., Yang, Y., Liu, S.: $$\\text{S}^{2}\\text{ m}^{2}$$: Scalable stereo matching model for reliable depth estimation. arXiv preprint arXiv:2503.12345 (2025)"},{"key":"5146_CR43","doi-asserted-by":"publisher","unstructured":"Zhang, Y., Chen, Y., Bai, X., Yu, S., Yu, K., Li, K., Yang, K.: Adaptive unimodal cost volume filtering for deep stereo matching. In: Proc. AAAI Conf. Artif. Intell., vol.\u00a034, pp. 12926\u201312934. AAAI Press, New York, NY, USA (2020). https:\/\/doi.org\/10.1609\/aaai.v34i07.6754","DOI":"10.1609\/aaai.v34i07.6754"},{"key":"5146_CR44","doi-asserted-by":"publisher","unstructured":"Zhao, Y., Zhong, H., Jia, B., Li, H.: A fast stereo matching network based on temporal attention and 2D convolution. Pattern Recognit. 144, 109808 (2023). https:\/\/doi.org\/10.1016\/j.patcog.2023.109808","DOI":"10.1016\/j.patcog.2023.109808"}],"container-title":["Signal, Image and Video Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-026-05146-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11760-026-05146-3","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-026-05146-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,22]],"date-time":"2026-03-22T22:15:51Z","timestamp":1774217751000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11760-026-05146-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,16]]},"references-count":44,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2026,3]]}},"alternative-id":["5146"],"URL":"https:\/\/doi.org\/10.1007\/s11760-026-05146-3","relation":{},"ISSN":["1863-1703","1863-1711"],"issn-type":[{"value":"1863-1703","type":"print"},{"value":"1863-1711","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,16]]},"assertion":[{"value":"10 October 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 December 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 January 2026","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 February 2026","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare that they have no conflict of interest.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"90"}}