{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,14]],"date-time":"2025-11-14T06:39:24Z","timestamp":1763102364959,"version":"3.45.0"},"reference-count":41,"publisher":"Tech Science Press","issue":"1","license":[{"start":{"date-parts":[[2025,3,30]],"date-time":"2025-03-30T00:00:00Z","timestamp":1743292800000},"content-version":"vor","delay-in-days":88,"URL":"https:\/\/doi.org\/10.32604\/TSP-CROSSMARKPOLICY"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["CMC"],"published-print":{"date-parts":[[2025]]},"DOI":"10.32604\/cmc.2025.060395","type":"journal-article","created":{"date-parts":[[2025,2,10]],"date-time":"2025-02-10T02:53:32Z","timestamp":1739156012000},"page":"761-783","update-policy":"https:\/\/doi.org\/10.32604\/tsp-crossmarkpolicy","source":"Crossref","is-referenced-by-count":0,"title":["MMCSD: Multi-Modal Knowledge Graph Completion Based on Super-Resolution and Detailed Description Generation"],"prefix":"10.32604","volume":"83","author":[{"given":"Huansha","family":"Wang","sequence":"first","affiliation":[]},{"given":"Ruiyang","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Qinrang","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Shaomei","family":"Li","sequence":"additional","affiliation":[]},{"given":"Jianpeng","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"17807","published-online":{"date-parts":[[2025]]},"reference":[{"key":"ref1","series-title":"Proceedings of the Twenty-Sixth International Joint Conference on Artificial Intelligence","first-page":"3140","article-title":"Image-embodied knowledge representation learning","volume":"2017","author":"Xie","year":"2017 Aug 19\u201326"},{"key":"ref2","series-title":"Proceedings of the Seventh Joint Conference on Lexical and Computational Semantics","first-page":"225","article-title":"A multimodal translation-based approach for knowledge Graph Representation learning","author":"Mousselly Sergieh","year":"2018"},{"key":"ref3","series-title":"2019 International Joint Conference on Neural Networks (IJCNN)","first-page":"1","article-title":"Multimodal data enhanced representation learning for knowledge graphs","volume":"2019","author":"Wang","year":"2019 Jul 14\u201319"},{"key":"ref4","series-title":"2023 International Joint Conference on Neural Networks (IJCNN)","first-page":"1","article-title":"Modality-aware negative sampling for multi-modal knowledge graph embedding","volume":"2023","author":"Zhang","year":"2023 Jun 18\u201323"},{"key":"ref5","series-title":"Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing","first-page":"10527","article-title":"MoSE: modality split and ensemble for multimodal knowledge graph completion","author":"Zhao","year":"2022"},{"key":"ref6","series-title":"Proceedings of the 32nd ACM International Conference on Multimedia","first-page":"233","article-title":"Making large language models perform better in knowledge graph completion","author":"Zhang","year":"2024"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"123","DOI":"10.1007\/978-3-031-44693-1_10","author":"Zhang","year":"2023","journal-title":"Natural language processing and Chinese computing"},{"key":"ref8","series-title":"2017 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","first-page":"1132","article-title":"Enhanced deep residual networks for single image super-resolution","volume":"2017","author":"Lim","year":"2017 Jul 21\u201326"},{"key":"ref9","series-title":"Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing","first-page":"1499","article-title":"Representing text for joint embedding of text and knowledge bases","author":"Toutanova","year":"2015"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"459","DOI":"10.1007\/978-3-030-21348-0_30","author":"Liu","year":"2019","journal-title":"The semantic web"},{"key":"ref11","series-title":"NIPS\u201913: Proceedings of the 27th International Conference on Neural Information Processing Systems (NIPS)","first-page":"2787","article-title":"Translating embeddings for modeling multi relational data","author":"Bordes","year":"2013 Dec 5\u20138"},{"key":"ref12","first-page":"1112","article-title":"Knowledge graph embedding by translating on hyperplanes","author":"Wang","year":"2014","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"ref13","unstructured":"Sun Z, Deng Z, Nie J, Tang J. RotatE: knowledge graph embedding by relational rotation in complex space. arXiv:1902.10197. 2019."},{"key":"ref14","first-page":"1811","article-title":"Convolutional 2D knowledge graph embeddings","author":"Dettmers","year":"2018","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"ref15","series-title":"Proceedings of the 2018 Conference of the North American Chapter Of the Association for Computational Linguistics: Human Language Technologies","first-page":"327","article-title":"A novel embedding model for knowledge base completion based on Convolutional neural network","author":"Nguyen","year":"2018"},{"key":"ref16","first-page":"593","author":"Schlichtkrull","year":"2018","journal-title":"The semantic web"},{"key":"ref17","series-title":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","first-page":"4710","article-title":"Learning attention-based embeddings for relation prediction in knowledge graphs","author":"Nathani","year":"2019"},{"key":"ref18","series-title":"NIPS\u201917: Proceedings of the 31st International Conference on Neural Information Processing Systems","first-page":"5998","article-title":"Attention is all you need","author":"Vaswani","year":"2017 Dec 4\u20139"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"84","DOI":"10.1007\/978-3-319-68204-4_8","author":"Ferrada","year":"2017","journal-title":"The semantic web-ISWC 2017"},{"key":"ref20","series-title":"Proceedings of the 1st Workshop on Multilingual Representation Learning","first-page":"138","article-title":"VisualSem: a high-quality knowledge graph for vision and language","author":"Alberts","year":"2021"},{"key":"ref21","series-title":"Proceedings of the 30th ACM International Conference on Information & Knowledge Management","first-page":"4445","article-title":"GAKG: a multimodal geoscience academic knowledge graph","author":"Deng","year":"2021 Nov 1\u20135"},{"key":"ref22","series-title":"Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing","first-page":"3208","article-title":"Embedding multimodal relational data for knowledge base completion","author":"Pezeshkpour","year":"2018"},{"key":"ref23","unstructured":"Zhang Y, Zhang W. Knowledge graph completion with pre-trained multimodal transformer and twins negative sampling. arXiv:2209.07084. 2022."},{"key":"ref24","unstructured":"Kipf TN, Welling M. Semi supervised classification with graph convolutional networks. arXiv:1609.02907. 2017."},{"key":"ref25","unstructured":"Velickovic P, Cucurull G, Casanova A, Romero A, Li\u00f2 P, Bengio Y. Graph attention networks. arXiv:1710.10903. 2018."},{"key":"ref26","series-title":"2024 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","first-page":"26753","article-title":"Monkey: image resolution and text label are important things for large multi-modal models","volume":"2024","author":"Li","year":"2024 Jun 16\u201322"},{"key":"ref27","series-title":"International Conference on Machine Learning","first-page":"19730","article-title":"BLIP-2: bootstrapping language-image pre-training with frozen image encoders and large language models","author":"Li","year":"2023 Jul 23\u201329"},{"key":"ref28","unstructured":"Du Y, Li C, Guo R, Yin X, Liu W, Zhou J, et al. PP-OCR: a practical ultra lightweight OCR system. arXiv:2009.09941. 2020."},{"key":"ref29","series-title":"Computer Vision-ECCV 2024-18th European Conference","first-page":"207","article-title":"GRiT: a generative region-to-text transformer for object understanding","author":"Wu","year":"2024 Sep 29\u2013Oct 4"},{"key":"ref30","unstructured":"Zhao X, Ding W, An Y, Du Y, Yu T, Li M, et al. Fast segment anything. arXiv:2306.12156. 2023."},{"key":"ref31","unstructured":"Bai J, Bai S, Chu Y, Cui Z, Dang K, Deng X, et al. Qwen technical report. arXiv.2309.16609. 2024."},{"key":"ref32","unstructured":"Kingma DP, Welling M. Auto-encoding variational bayes. arXiv:1312.6114. 2022."},{"key":"ref33","series-title":"22nd International Semantic Web Conference","first-page":"121","article-title":"Rethinking uncertainly missing and ambiguous visual modality in multi-modal entity alignment","author":"Chen","year":"2023 Nov 6\u201310"},{"key":"ref34","series-title":"Proceedings of the 38th International Conference on Machine Learning (PMLR 139)","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","author":"Radford","year":"2021 Jul 18\u201324"},{"key":"ref35","series-title":"3rd International Conference on Learning Representations, ICLR 2015","article-title":"Embedding entities and relations for learning and inference in knowledge bases","author":"Yang","year":"2015 May 7\u20139"},{"key":"ref36","series-title":"Proceedings of the 33rd International Conference on Machine Learning","first-page":"2071","article-title":"Complex embeddings for simple link prediction","author":"Trouillon","year":"2016 Jun 19\u201324"},{"key":"ref37","series-title":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","first-page":"904","article-title":"Hybrid transformer with multi-level fusion for multimodal knowledge graph completion","author":"Chen","year":"2022"},{"key":"ref38","series-title":"Proceedings of the ACM Web Conference 2023","first-page":"2572","article-title":"IMF: interactive multimodal fusion model for link prediction","author":"Li","year":"2023"},{"key":"ref39","first-page":"8957","article-title":"LAFA: multimodal knowledge graph completion with link aware fusion and aggregation","volume":"38","author":"Shang","year":"2024","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"ref40","series-title":"Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval","first-page":"102","article-title":"Contrast then memorize: semantic neighbor retrieval-enhanced inductive multimodal knowledge graph completion","author":"Zhao","year":"2024"},{"key":"ref41","first-page":"1","article-title":"HKA: a hierarknowledge alignment framework for multimodal knowledge graph completion","volume":"20","author":"Xu","year":"2024","journal-title":"ACM Trans Multimed Comput Commun Appl"}],"container-title":["Computers, Materials &amp; Continua"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/cdn.techscience.cn\/files\/cmc\/2025\/TSP_CMC-83-1\/TSP_CMC_60395\/TSP_CMC_60395.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,14]],"date-time":"2025-11-14T06:36:21Z","timestamp":1763102181000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.techscience.com\/cmc\/v83n1\/60096"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"references-count":41,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025]]},"published-print":{"date-parts":[[2025]]}},"URL":"https:\/\/doi.org\/10.32604\/cmc.2025.060395","relation":{},"ISSN":["1546-2226"],"issn-type":[{"type":"electronic","value":"1546-2226"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"2024-10-31","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2025-01-20","order":1,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2025-03-26","order":2,"name":"published","label":"Published Online","group":{"name":"publication_history","label":"Publication History"}}]}}