{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T19:35:29Z","timestamp":1777664129646,"version":"3.51.4"},"publisher-location":"Singapore","reference-count":50,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819666027","type":"print"},{"value":"9789819666034","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,7,9]],"date-time":"2025-07-09T00:00:00Z","timestamp":1752019200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,7,9]],"date-time":"2025-07-09T00:00:00Z","timestamp":1752019200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-981-96-6603-4_18","type":"book-chapter","created":{"date-parts":[[2025,7,8]],"date-time":"2025-07-08T11:15:29Z","timestamp":1751973329000},"page":"253-268","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["PEDRO: Parameter-Efficient Fine-Tuning with\u00a0Prompt DEpenDent Representation MOdification"],"prefix":"10.1007","author":[{"given":"Tianfang","family":"Xie","sequence":"first","affiliation":[]},{"given":"Tianjing","family":"Li","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Zhu","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Han","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,7,9]]},"reference":[{"key":"18_CR1","doi-asserted-by":"publisher","unstructured":"Aghajanyan, A., Gupta, S., Zettlemoyer, L.: Intrinsic dimensionality explains the effectiveness of language model fine-tuning. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 7319\u20137328. Association for Computational Linguistics (2021). https:\/\/doi.org\/10.18653\/v1\/2021.acl-long.568, https:\/\/aclanthology.org\/2021.acl-long.568","DOI":"10.18653\/v1\/2021.acl-long.568"},{"key":"18_CR2","doi-asserted-by":"crossref","unstructured":"Ben-Zaken, E., Ravfogel, S., Goldberg, Y.: Bitfit: simple parameter-efficient fine-tuning for transformer-based masked language-models. ArXiv arXiv:2106.10199 (2021)","DOI":"10.18653\/v1\/2022.acl-short.1"},{"key":"18_CR3","unstructured":"Boull\u2019e, N., Nakatsukasa, Y., Townsend, A.: Rational neural networks. ArXiv arXiv:2004.01902 (2020). https:\/\/api.semanticscholar.org\/CorpusID:214802374"},{"key":"18_CR4","unstructured":"Chen, L., Ye, Z., Wu, Y., Zhuo, D., Ceze, L., Krishnamurthy, A.: Punica: multi-tenant lora serving. ArXiv arXiv:2310.18547 (2023). https:\/\/api.semanticscholar.org\/CorpusID:264590197"},{"key":"18_CR5","unstructured":"Delfosse, Q., Schramowski, P., Molina, A., Kersting, K.: Recurrent rational networks. arXiv preprint arXiv:2102.09407 (2021)"},{"key":"18_CR6","unstructured":"Delfosse, Q., Schramowski, P., Mundt, M., Molina, A., Kersting, K.: Adaptive rational activations to boost deep reinforcement learning (2021). https:\/\/api.semanticscholar.org\/CorpusID:246430610"},{"key":"18_CR7","doi-asserted-by":"crossref","unstructured":"Dettmers, T., Pagnoni, A., Holtzman, A., Zettlemoyer, L.: QLoRA: efficient finetuning of quantized LLMs. arXiv e-prints arXiv:2305.14314 (2023)","DOI":"10.52202\/075280-0441"},{"key":"18_CR8","doi-asserted-by":"crossref","unstructured":"Ding, N., et al.: Delta tuning: a comprehensive study of parameter efficient methods for pre-trained language models. ArXiv arXiv:2203.06904 (2022)","DOI":"10.21203\/rs.3.rs-1553541\/v1"},{"key":"18_CR9","unstructured":"Gholamalinezhad, H., Khosravi, H.: Pooling methods in deep neural networks, a review. arXiv preprint arXiv:2009.07485 (2020)"},{"key":"18_CR10","unstructured":"Gong, J., Qiu, X., Wang, S., Huang, X.: Information aggregation via dynamic routing for sequence encoding. In: COLING (2018)"},{"key":"18_CR11","doi-asserted-by":"publisher","unstructured":"Guo, D., Rush, A., Kim, Y.: Parameter-efficient transfer learning with diff pruning. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 4884\u20134896. Association for Computational Linguistics (2021). https:\/\/doi.org\/10.18653\/v1\/2021.acl-long.378, https:\/\/aclanthology.org\/2021.acl-long.378","DOI":"10.18653\/v1\/2021.acl-long.378"},{"key":"18_CR12","unstructured":"Hendrycks, D., et al.: Measuring massive multitask language understanding. arXiv preprint arXiv:2009.03300 (2020)"},{"key":"18_CR13","unstructured":"Hendrycks, D., Gimpel, K.: Gaussian error linear units (gelus). arXiv: Learning (2016)"},{"key":"18_CR14","unstructured":"Houlsby, N., et al.: Parameter-efficient transfer learning for NLP. In: International Conference on Machine Learning, pp. 2790\u20132799. PMLR (2019)"},{"key":"18_CR15","unstructured":"Hu, E.J., et al.: Lora: low-rank adaptation of large language models. arXiv preprint arXiv:2106.09685 (2021)"},{"key":"18_CR16","unstructured":"Hu, S., et al.: Sparse structure search for parameter-efficient tuning. ArXiv arXiv:2206.07382 (2022)"},{"key":"18_CR17","unstructured":"Huang, Y., et\u00a0al.: C-eval: a multi-level multi-discipline Chinese evaluation suite for foundation models. arXiv preprint arXiv:2305.08322 (2023)"},{"key":"18_CR18","doi-asserted-by":"crossref","unstructured":"Lester, B., Al-Rfou, R., Constant, N.: The power of scale for parameter-efficient prompt tuning. arXiv preprint arXiv:2104.08691 (2021)","DOI":"10.18653\/v1\/2021.emnlp-main.243"},{"key":"18_CR19","doi-asserted-by":"crossref","unstructured":"Lewis, M., et al.: Bart: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. arXiv preprint arXiv:1910.13461 (2019)","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"18_CR20","doi-asserted-by":"crossref","unstructured":"Li, H., et al.: Cmmlu: measuring massive multitask language understanding in Chinese. arXiv preprint arXiv:2306.09212 (2023)","DOI":"10.18653\/v1\/2024.findings-acl.671"},{"key":"18_CR21","unstructured":"Li, X.L., Liang, P.: Prefix-tuning: optimizing continuous prompts for generation. arXiv preprint arXiv:2101.00190 (2021)"},{"key":"18_CR22","doi-asserted-by":"crossref","unstructured":"Li, X., et al.: Unified demonstration retriever for in-context learning. In: Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 4644\u20134668 (2023)","DOI":"10.18653\/v1\/2023.acl-long.256"},{"key":"18_CR23","unstructured":"Liu, H., Simonyan, K., Yang, Y.: Darts: differentiable architecture search. ArXiv arXiv:1806.09055 (2019)"},{"key":"18_CR24","unstructured":"Liu, H., et al.: Few-shot parameter-efficient fine-tuning is better and cheaper than in-context learning. ArXiv arXiv:2205.05638 (2022). https:\/\/api.semanticscholar.org\/CorpusID:248693283"},{"key":"18_CR25","doi-asserted-by":"crossref","unstructured":"Liu, X., Sun, T., Huang, X., Qiu, X.: Late prompt tuning: a late prompt could be better than many prompts. ArXiv arXiv:2210.11292 (2022)","DOI":"10.18653\/v1\/2022.findings-emnlp.95"},{"key":"18_CR26","doi-asserted-by":"crossref","unstructured":"Liu, X., Ji, K., Fu, Y., Du, Z., Yang, Z., Tang, J.: P-tuning v2: prompt tuning can be comparable to fine-tuning universally across scales and tasks. ArXiv arXiv:2110.07602 (2021)","DOI":"10.18653\/v1\/2022.acl-short.8"},{"key":"18_CR27","doi-asserted-by":"crossref","unstructured":"Liu, X., et al.: P-tuning: prompt tuning can be comparable to fine-tuning across scales and tasks. In: Annual Meeting of the Association for Computational Linguistics (2022)","DOI":"10.18653\/v1\/2022.acl-short.8"},{"key":"18_CR28","unstructured":"Mahabadi, R.K., Henderson, J., Ruder, S.: Compacter: efficient low-rank hypercomplex adapter layers. In: NeurIPS (2021)"},{"key":"18_CR29","unstructured":"Molina, A., Schramowski, P., Kersting, K.: Pad\u00e9 activation units: end-to-end learning of flexible activation functions in deep networks. ArXiv arXiv:1907.06732 (2019). https:\/\/api.semanticscholar.org\/CorpusID:196831891"},{"key":"18_CR30","unstructured":"OpenAI: GPT-4 Technical Report. arXiv e-prints arXiv:2303.08774 (2023)"},{"key":"18_CR31","doi-asserted-by":"publisher","unstructured":"Pfeiffer, J., Kamath, A., R\u00fcckl\u00e9, A., Cho, K., Gurevych, I.: AdapterFusion: non-destructive task composition for transfer learning. In: Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume. pp. 487\u2013503. Association for Computational Linguistics (2021). https:\/\/doi.org\/10.18653\/v1\/2021.eacl-main.39, https:\/\/aclanthology.org\/2021.eacl-main.39","DOI":"10.18653\/v1\/2021.eacl-main.39"},{"key":"18_CR32","doi-asserted-by":"crossref","unstructured":"Qin, C., Zhang, A., Zhang, Z., Chen, J., Yasunaga, M., Yang, D.: Is ChatGPT a general-purpose natural language processing task solver? arXiv preprint arXiv:2302.06476 (2023)","DOI":"10.18653\/v1\/2023.emnlp-main.85"},{"key":"18_CR33","unstructured":"Radford, A., Narasimhan, K., Salimans, T., Sutskever, I., et\u00a0al.: Improving language understanding by generative pre-training. OpenAI (2018)"},{"key":"18_CR34","doi-asserted-by":"publisher","unstructured":"Rajpurkar, P., Zhang, J., Lopyrev, K., Liang, P.: SQuAD: 100,000+ questions for machine comprehension of text. In: Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing, pp. 2383\u20132392. Association for Computational Linguistics, Austin, Texas (2016).https:\/\/doi.org\/10.18653\/v1\/D16-1264, https:\/\/www.aclweb.org\/anthology\/D16-1264","DOI":"10.18653\/v1\/D16-1264"},{"key":"18_CR35","doi-asserted-by":"crossref","unstructured":"Rubin, O., Herzig, J., Berant, J.: Learning to retrieve prompts for in-context learning. In: Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 2655\u20132671 (2022)","DOI":"10.18653\/v1\/2022.naacl-main.191"},{"key":"18_CR36","doi-asserted-by":"crossref","unstructured":"R\u00fcckl\u00e9, A., et al.: Adapterdrop: on the efficiency of adapters in transformers. In: Conference on Empirical Methods in Natural Language Processing (2020)","DOI":"10.18653\/v1\/2021.emnlp-main.626"},{"key":"18_CR37","doi-asserted-by":"crossref","unstructured":"Suzgun, M., et\u00a0al.: Challenging big-bench tasks and whether chain-of-thought can solve them. arXiv preprint arXiv:2210.09261 (2022)","DOI":"10.18653\/v1\/2023.findings-acl.824"},{"key":"18_CR38","unstructured":"Taori, R., et al.: Stanford alpaca: an instruction-following llama model (2023). https:\/\/github.com\/tatsu-lab\/stanford_alpaca"},{"key":"18_CR39","unstructured":"Team, G., et\u00a0al.: Gemma: open models based on gemini research and technology. arXiv preprint arXiv:2403.08295 (2024)"},{"key":"18_CR40","unstructured":"Touvron, H., et al.: Llama 2: open foundation and fine-tuned chat models. ArXiv arXiv:2307.09288 (2023). https:\/\/api.semanticscholar.org\/CorpusID:259950998"},{"key":"18_CR41","unstructured":"Vaswani, A., et al.: Attention is all you need. ArXiv arXiv:1706.03762 (2017)"},{"key":"18_CR42","unstructured":"Wang, A., et al.: Superglue: a stickier benchmark for general-purpose language understanding systems. ArXiv arXiv:1905.00537 (2019)"},{"key":"18_CR43","doi-asserted-by":"crossref","unstructured":"Wang, A., Singh, A., Michael, J., Hill, F., Levy, O., Bowman, S.R.: Glue: a multi-task benchmark and analysis platform for natural language understanding. In: BlackboxNLP@EMNLP (2018)","DOI":"10.18653\/v1\/W18-5446"},{"key":"18_CR44","unstructured":"Wolf, T., et al.: Transformers: state-of-the-art natural language processing. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations, pp. 38\u201345. Association for Computational Linguistics (2020). https:\/\/www.aclweb.org\/anthology\/2020.emnlp-demos.6"},{"key":"18_CR45","unstructured":"Zhang, Q., et al.: Adaptive budget allocation for parameter-efficient fine-tuning. ArXiv arXiv:2303.10512 (2023). https:\/\/api.semanticscholar.org\/CorpusID:257631760"},{"key":"18_CR46","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Wang, P., Tan, M., Zhu, W.G.: Learned adapters are better than manually designed adapters. In: Annual Meeting of the Association for Computational Linguistics (2023). https:\/\/api.semanticscholar.org\/CorpusID:259858833","DOI":"10.18653\/v1\/2023.findings-acl.468"},{"key":"18_CR47","doi-asserted-by":"publisher","unstructured":"Zhao, M., Lin, T., Mi, F., Jaggi, M., Sch\u00fctze, H.: Masking as an efficient alternative to finetuning for pretrained language models. In: Webber, B., Cohn, T., He, Y., Liu, Y. (eds.) Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 2226\u20132241. Association for Computational Linguistics (2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.174, https:\/\/aclanthology.org\/2020.emnlp-main.174","DOI":"10.18653\/v1\/2020.emnlp-main.174"},{"key":"18_CR48","unstructured":"Zhao, W.X., et al.: A survey of large language models. arXiv e-prints arXiv:2303.18223 (2023)"},{"key":"18_CR49","unstructured":"Zheng, L., et al.: Judging LLM-as-a-judge with MT-bench and chatbot arena. arXiv e-prints arXiv:2306.05685 (2023)"},{"key":"18_CR50","doi-asserted-by":"crossref","unstructured":"Zhu, W., Wang, X., Zheng, H., Chen, M., Tang, B.: PromptCBLUE: a Chinese prompt tuning benchmark for the medical domain. arXiv e-prints arXiv:2310.14151 (2023)","DOI":"10.2139\/ssrn.4685921"}],"container-title":["Lecture Notes in Computer Science","Neural Information Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-6603-4_18","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T07:34:55Z","timestamp":1777448095000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-6603-4_18"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,9]]},"ISBN":["9789819666027","9789819666034"],"references-count":50,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-6603-4_18","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,7,9]]},"assertion":[{"value":"9 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICONIP","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Neural Information Processing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Auckland","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"New Zealand","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 December 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6 December 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"31","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"iconip2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/iconip2024.org","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}