{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,15]],"date-time":"2025-05-15T04:50:03Z","timestamp":1747284603061},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2024,4,9]],"date-time":"2024-04-09T00:00:00Z","timestamp":1712620800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,4,9]],"date-time":"2024-04-09T00:00:00Z","timestamp":1712620800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2024,6]]},"DOI":"10.1007\/s00530-024-01307-x","type":"journal-article","created":{"date-parts":[[2024,4,9]],"date-time":"2024-04-09T17:01:40Z","timestamp":1712682100000},"update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Synchronous composition and semantic line detection based on cross-attention"],"prefix":"10.1007","volume":"30","author":[{"given":"Qinggang","family":"Hou","sequence":"first","affiliation":[]},{"given":"Yongzhen","family":"Ke","sequence":"additional","affiliation":[]},{"given":"Kai","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Fan","family":"Qin","sequence":"additional","affiliation":[]},{"given":"Yaoting","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,4,9]]},"reference":[{"key":"1307_CR1","doi-asserted-by":"crossref","unstructured":"Jin, W., Sanjabi, M., Nie, S., Tan, L., Ren, X., Firooz, H.: Msd: Saliency-aware knowledge distillation for multimodal understanding. In: Findings of the Association for Computational Linguistics: EMNLP 2021, 3557\u20133569 (2021)","DOI":"10.18653\/v1\/2021.findings-emnlp.302"},{"key":"1307_CR2","doi-asserted-by":"crossref","unstructured":"Hariharan, B., Arbelaez, P., Girshick, R., Malik, J.: Object instance segmentation and fine-grained localization using hypercolumns. IEEE Trans. Pattern Anal. Mach. Intell. (PAMI) (2016)","DOI":"10.1109\/CVPR.2015.7298642"},{"key":"1307_CR3","doi-asserted-by":"crossref","unstructured":"Mai, L., Jin, H., Liu, F.: Composition-preserving deep photo aesthetics assessment. in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition(CVPR), 497\u2013506 (2016)","DOI":"10.1109\/CVPR.2016.60"},{"key":"1307_CR4","doi-asserted-by":"publisher","DOI":"10.4324\/9780203944141","volume-title":"Photography Theory","author":"J Elkins","year":"2013","unstructured":"Elkins, J.: Photography Theory. Routledge (2013)"},{"key":"1307_CR5","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1016\/j.jvcir.2018.05.018","volume":"55","author":"J-T Lee","year":"2018","unstructured":"Lee, J.-T., Kim, H.-U., Lee, C., Kim, C.-S.: Photographic composition classification and dominant geometric element detection for outdoor scenes. J. Vis. Commun. Image Represent. 55, 91\u2013105 (2018)","journal-title":"J. Vis. Commun. Image Represent."},{"key":"1307_CR6","unstructured":"Wen, C.-L., Chia, T.-L.: The fuzzy approach for classification of the photo composition. In: 2012 International Conference on Machine Learning and Cybernetics(ICMLC), 4, IEEE, 1447\u20131453 (2012)"},{"key":"1307_CR7","doi-asserted-by":"crossref","unstructured":"Lee, J.-T., Kim, H.-U., Lee, C., Kim, C.-S.: Semantic line detection and its applications. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), 3229\u20133237 (2017)","DOI":"10.1109\/ICCV.2017.350"},{"key":"1307_CR8","doi-asserted-by":"crossref","unstructured":"Jin, D., Lee, J.-T., Kim, C.-S.: Semantic line detection using mirror attention and comparative ranking and matching. In: Proceedings of the European Conference on Computer Vision (ECCV), 119\u2013135 (2020)","DOI":"10.1007\/978-3-030-58565-5_8"},{"key":"1307_CR9","doi-asserted-by":"crossref","unstructured":"Jin, D., Park, W., Jeong, S.-G., Kim, C.-S.: Harmonious semantic line detection via maximal weight clique selection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 16737\u201316745 (2021)","DOI":"10.1109\/CVPR46437.2021.01646"},{"key":"1307_CR10","doi-asserted-by":"crossref","unstructured":"Zhao, K., Han, Q., Zhang, C.-B., Xu, J., Cheng, M.-M.: Deep hough transform for semantic line detection. IEEE Trans. Pattern Anal. Mach. Intell. (PAMI) (2021)","DOI":"10.1109\/TPAMI.2021.3077129"},{"key":"1307_CR11","unstructured":"Hinton, G., Vinyals, O., Dean, J.: Distilling the knowledge in a neural network. arXiv preprint arXiv:1503.02531 (2015)"},{"key":"1307_CR12","doi-asserted-by":"crossref","unstructured":"Gou, J., Sun, L., Yu, B., Wan, S., Ou, W., Yi, Z.: Multi-level attention-based sample correlations for knowledge distillation. IEEE Trans. Ind. Inform. (2022)","DOI":"10.1109\/TII.2022.3209672"},{"key":"1307_CR13","unstructured":"Yu, Y., Li, B., Ji, Z., Han, J., Zhang, Z.: Knowledge distillation classifier generation network for zero-shot learning. IEEE Trans. Neural Netw. Learn. Syst. (2021)"},{"key":"1307_CR14","doi-asserted-by":"publisher","first-page":"1789","DOI":"10.1007\/s11263-021-01453-z","volume":"129","author":"J Gou","year":"2021","unstructured":"Gou, J., Yu, B., Maybank, S.J., Tao, D.: Knowledge distillation: a survey. Int. J. Comput. Vis. (IJCV) 129, 1789\u20131819 (2021)","journal-title":"Int. J. Comput. Vis. (IJCV)"},{"key":"1307_CR15","doi-asserted-by":"publisher","first-page":"690","DOI":"10.1109\/TNNLS.2016.2522428","volume":"28","author":"J Li","year":"2016","unstructured":"Li, J., Mei, X., Prokhorov, D., Tao, D.: Deep neural network for structural prediction and lane detection in traffic scene. IEEE Trans. Neural Netw. Learn. Syst. 28, 690\u2013703 (2016)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"1307_CR16","unstructured":"Wang, Q., Han, T., Qin, Z., Gao, J., Li, X.: Multitask attention network for lane detection and fitting. IEEE Trans. Neural Netw. Learn. Syst. (2020)"},{"key":"1307_CR17","doi-asserted-by":"publisher","first-page":"2676","DOI":"10.1109\/TNNLS.2020.3007534","volume":"32","author":"Y Ji","year":"2020","unstructured":"Ji, Y., Zhang, H., Jie, Z., Ma, L., Wu, Q.J.: Casnet: A cross-attention Siamese network for video salient object detection. IEEE Trans. Neural Netw. Learn. Syst. 32, 2676\u20132690 (2020)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"1307_CR18","unstructured":"Zhang, B., Niu, L., Zhang, L.: Image composition assessment with saliency-augmented multi-pattern pooling (2021)"},{"key":"1307_CR19","doi-asserted-by":"crossref","unstructured":"Hong, C., Du, S., Xian, K., Lu, H., Cao, Z., Zhong, W.: Composing photos like a photographer. In: 2021 IEEE Conference on Computer Vision and Pattern Recognition(CVPR), IEEE, (2021)","DOI":"10.1109\/CVPR46437.2021.00698"},{"key":"1307_CR20","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/S0734-189X(88)80033-1","volume":"44","author":"J Illingworth","year":"1988","unstructured":"Illingworth, J., Kittler, J.: A survey of the hough transform. Comput. Vis. Graph. Image Process. 44, 87\u2013116 (1988)","journal-title":"Comput. Vis. Graph. Image Process."},{"key":"1307_CR21","doi-asserted-by":"crossref","unstructured":"Xue, N., Wu, T., Bai, S., Wang, F., Xia, G.-S., Zhang, L., Torr, P.\u00a0H.: Holistically-attracted wireframe parsing. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 2788\u20132797 (2020)","DOI":"10.1109\/CVPR42600.2020.00286"},{"key":"1307_CR22","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision(ICCV), 1440\u20131448 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"1307_CR23","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition(CVPR), 580\u2013587 (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"1307_CR24","doi-asserted-by":"crossref","unstructured":"Kong, S., Shen, X., Lin, Z., Mech, R., Fowlkes, C.: Photo aesthetics ranking network with attributes and content adaptation. In: European Conference on Computer Vision (ECCV), 662\u2013679 (2016)","DOI":"10.1007\/978-3-319-46448-0_40"},{"key":"1307_CR25","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.-J., Li, K., Fei-Fei, L.: Imagenet: A large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), IEEE, 248\u2013255 (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"1307_CR26","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale visual recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"1307_CR27","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., Krause, J., Satheesh, S., Ma, S., Huang, Z., Karpathy, A., Khosla, A., Bernstein, M., et al.: Imagenet large scale visual recognition challenge. Int. J. Comput. Vis. (IJCV) 115, 211\u2013252 (2015)","journal-title":"Int. J. Comput. Vis. (IJCV)"},{"key":"1307_CR28","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.-Y., Kweon, I.\u00a0S.: Cbam: Convolutional block attention module. In: Proceedings of the European Conference on Computer Vision (ECCV), 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"1307_CR29","doi-asserted-by":"crossref","unstructured":"Shen, Z., Cui, C., Huang, J., Zong, J., Chen, M., Yin, Y.: Deep adaptive feature aggregation in multi-task convolutional neural networks. In: Proceedings of the 29th ACM International Conference on Information & Knowledge Management, 2213\u20132216 (2020)","DOI":"10.1145\/3340531.3412132"},{"key":"1307_CR30","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"key":"1307_CR31","unstructured":"Powers, D.M.: Evaluation: from precision, recall and f-measure to roc, informedness, markedness and correlation. arXiv preprint arXiv:2010.16061 (2020)"},{"key":"1307_CR32","doi-asserted-by":"publisher","first-page":"299","DOI":"10.1109\/TKDE.2005.50","volume":"17","author":"J Huang","year":"2005","unstructured":"Huang, J., Ling, C.X.: Using AUC and accuracy in evaluating learning algorithms. IEEE Trans. Knowl. Data Eng. 17, 299\u2013310 (2005)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"1307_CR33","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1023\/A:1007379606734","volume":"28","author":"R Caruana","year":"1997","unstructured":"Caruana, R.: Multitask learning. Mach. Learn. 28, 41\u201375 (1997)","journal-title":"Mach. Learn."},{"key":"1307_CR34","doi-asserted-by":"crossref","unstructured":"Misra, I., Shrivastava, A., Gupta, A., Hebert, M.: Cross-stitch networks for multi-task learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 3994\u20134003 (2016)","DOI":"10.1109\/CVPR.2016.433"},{"key":"1307_CR35","doi-asserted-by":"crossref","unstructured":"Gao, Y., Ma, J., Zhao, M., Liu, W., Yuille, A.L.: Nddr-cnn: Layerwise feature fusing in multi-task cnns by neural discriminative dimensionality reduction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision(CVPR), 3205\u20133214 (2019)","DOI":"10.1109\/CVPR.2019.00332"},{"key":"1307_CR36","doi-asserted-by":"publisher","first-page":"2133","DOI":"10.1109\/TCSVT.2021.3087823","volume":"32","author":"C Cui","year":"2022","unstructured":"Cui, C., Shen, Z., Huang, J., Chen, M., Xu, M., Wang, M., Yin, Y.: Adaptive feature aggregation in deep multi-task convolutional neural networks. IEEE Trans. Circ. Syst. Video Technol. 32, 2133\u20132144 (2022)","journal-title":"IEEE Trans. Circ. Syst. Video Technol."},{"key":"1307_CR37","unstructured":"Park, J., Woo, S., Lee, J.-Y., Kweon, I.S.: Bam: Bottleneck attention module. arXiv preprint arXiv:1807.06514 (2018)"},{"key":"1307_CR38","doi-asserted-by":"crossref","unstructured":"Selvaraju, R.R., Cogswell, M., Das, A., Vedantam, R., Parikh, D., Batra, D.: Grad-cam: Visual explanations from deep networks via gradient-based localization. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), 618\u2013626 (2017)","DOI":"10.1109\/ICCV.2017.74"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01307-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-024-01307-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01307-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,5]],"date-time":"2024-07-05T17:08:50Z","timestamp":1720199330000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-024-01307-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,9]]},"references-count":38,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,6]]}},"alternative-id":["1307"],"URL":"https:\/\/doi.org\/10.1007\/s00530-024-01307-x","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,4,9]]},"assertion":[{"value":"23 May 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 February 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 April 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"121"}}