{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,14]],"date-time":"2026-01-14T19:43:54Z","timestamp":1768419834865,"version":"3.49.0"},"reference-count":46,"publisher":"Springer Science and Business Media LLC","issue":"15","license":[{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1007\/s10489-025-06824-4","type":"journal-article","created":{"date-parts":[[2025,10,2]],"date-time":"2025-10-02T07:38:26Z","timestamp":1759390706000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["EGPT-SPE: story point effort estimation using improved GPT-2 by removing inefficient attention heads"],"prefix":"10.1007","volume":"55","author":[{"given":"Amna Shahid","family":"Cheemaa","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3687-0270","authenticated-orcid":false,"given":"Muhammad","family":"Azhar","sequence":"additional","affiliation":[]},{"given":"Fahim","family":"Arif","sequence":"additional","affiliation":[]},{"given":"Qazi Mazhar","family":"ul haq","sequence":"additional","affiliation":[]},{"given":"Muhammad","family":"Sohail","sequence":"additional","affiliation":[]},{"given":"Asma","family":"Iqbal","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,10,2]]},"reference":[{"issue":"2","key":"6824_CR1","doi-asserted-by":"publisher","first-page":"611","DOI":"10.1109\/TSE.2022.3158252","volume":"49","author":"M Fu","year":"2022","unstructured":"Fu M, Tantithamthavorn C (2022) GPT2SP: A transformer-based agile story point estimation approach. IEEE Trans Softw Eng 49(2):611\u2013625","journal-title":"IEEE Trans Softw Eng"},{"key":"6824_CR2","doi-asserted-by":"crossref","unstructured":"Tawosi V, Moussa R, Sarro F (2022) On the relationship between story points and development effort in Agile open-source software. In: Proceedings of the 16th ACM\/IEEE International Symposium on Empirical Software Engineering and Measurement (pp 183-194)","DOI":"10.1145\/3544902.3546238"},{"key":"6824_CR3","doi-asserted-by":"crossref","unstructured":"Tawosi V, Al-Subaihin A, Sarro F (2022) Investigating the effectiveness of clustering for story point estimation. In: 2022 IEEE International Conference on Software Analysis, Evolution and Reengineering (SANER) (pp 827-838). IEEE","DOI":"10.1109\/SANER53432.2022.00101"},{"key":"6824_CR4","doi-asserted-by":"publisher","unstructured":"Dam H (2019) Empowering Software Engineering with Artificial Intelligence. Artif Intell https:\/\/doi.org\/10.1007\/978-3-030-32242-7_3","DOI":"10.1007\/978-3-030-32242-7_3"},{"key":"6824_CR5","doi-asserted-by":"publisher","unstructured":"Alloghani M, Al-Jumeily O, Mustafna J, Hussain A, Aljaaf A (2020) A systematic review on supervised and unsupervised machine learning algorithms for data science. Supervised Unsupervised Learn Data Sci https:\/\/doi.org\/10.1007\/978-3-030-22475-2_1","DOI":"10.1007\/978-3-030-22475-2_1"},{"issue":"3","key":"6824_CR6","doi-asserted-by":"publisher","first-page":"569","DOI":"10.1007\/s41870-018-0131-2","volume":"11","author":"S Bilgaiyan","year":"2019","unstructured":"Bilgaiyan S, Mishra S, Das M (2019) Effort estimation in agile software development using experimental validation of neural network models. Int J Inf Technol 11(3):569\u2013573. https:\/\/doi.org\/10.1007\/s41870-018-0131-2","journal-title":"Int J Inf Technol"},{"issue":"4","key":"6824_CR7","doi-asserted-by":"publisher","first-page":"2605","DOI":"10.1007\/s13369-01904250-6","volume":"45","author":"A Kaushik","year":"2020","unstructured":"Kaushik A, Tayal DK, Yadav K (2020) A Comparative Analysis on Effort Estimation for Agile and Non-agile Software Projects Using DBN-ALO. Arabian J Sci Eng 45(4):2605\u20132618. https:\/\/doi.org\/10.1007\/s13369-01904250-6","journal-title":"Arabian J Sci Eng"},{"key":"6824_CR8","doi-asserted-by":"publisher","unstructured":"Kumar PS, Behera HS, Anisha Kumari K, Nayak J, Naik B (2020) Advancement from neural networks to deep learning in software effort estimation: Perspective of two decades. Comput Sci Rev 38:100288 https:\/\/doi.org\/10.1016\/j.cosrev.2020.100288","DOI":"10.1016\/j.cosrev.2020.100288"},{"key":"6824_CR9","doi-asserted-by":"publisher","first-page":"166768","DOI":"10.1109\/ACCESS.2020.3021664","volume":"8","author":"M Fern\u00e1ndez-Diego","year":"2020","unstructured":"Fern\u00e1ndez-Diego M, M\u00e9ndez ER, Gonz\u00e1lez-Ladr\u00f3n-DeGuevara F, Abrah\u00e3o S, Insfran E (2020) An update on effort estimation in agile software development: A systematic literature review. IEEE Access 8:166768\u2013166800. https:\/\/doi.org\/10.1109\/ACCESS.2020.3021664","journal-title":"IEEE Access"},{"key":"6824_CR10","doi-asserted-by":"publisher","unstructured":"Sharma A, Chaudhary N (2020) Linear Regression Model for Agile Software Development Effort Estimation. In: 2020 5th IEEE International Conference on Recent Advances in Innovative Engineering (ICRAIE 2020) (pp 4\u20137). https:\/\/doi.org\/10.1109\/ICRAIE51050.2020.9358309.","DOI":"10.1109\/ICRAIE51050.2020.9358309."},{"key":"6824_CR11","doi-asserted-by":"publisher","unstructured":"Arora M, Sharma A, Katoch S, Malviya M, Chopra S (2021) A State of the Art Regressor Model\u2019s comparison for Effort Estimation of Agile software. In: Proceedings of the 2021 2nd International Conference on Intelligent Engineering and Management (ICIEM 2021) (pp 211\u2013215). https:\/\/doi.org\/10.1109\/ICIEM51511.2021.9445345.","DOI":"10.1109\/ICIEM51511.2021.9445345."},{"issue":"2","key":"6824_CR12","first-page":"14","volume":"13","author":"M Vyas","year":"2021","unstructured":"Vyas M, Hemrajani N (2021) Predicting effort of agile software projects using linear regression, ridge regression, and logistic regression. Int J Tech Phys Prob Eng 13(2):14\u201319","journal-title":"Int J Tech Phys Prob Eng"},{"key":"6824_CR13","unstructured":"Sharma A, Chaudhary N (2021) Analysis of Software Effort Estimation Based on Story Point and Lines of Code using Machine Learning. Int J Comput Digit Syst, 1\u20138. [Online]. Available: https:\/\/journal.uob.edu.bh:443\/handle\/123456789\/4491"},{"issue":"13","key":"6824_CR14","doi-asserted-by":"publisher","first-page":"9","DOI":"10.5120\/ijca2021921014","volume":"174","author":"RK Mallidi","year":"2021","unstructured":"Mallidi RK, Sharma M (2021) Study on Agile Story Point Estimation Techniques and Challenges. Int J Comput Appl 174(13):9\u201314. https:\/\/doi.org\/10.5120\/ijca2021921014","journal-title":"Int J Comput Appl"},{"key":"6824_CR15","doi-asserted-by":"publisher","unstructured":"Radu L D (2019) Effort prediction in agile software development with Bayesian networks. In: ICSOFT 2019 - Proceedings of the 14th International Conference on Software Technologies (pp 238\u2013245). https:\/\/doi.org\/10.5220\/0007842802380245.","DOI":"10.5220\/0007842802380245."},{"key":"6824_CR16","doi-asserted-by":"publisher","unstructured":"Carvalho HDP, Lima MNCA, Santos WB, de Fagunde RA, A. (2020) Ensemble Regression Models for Software Development Effort Estimation: A Comparative Study. Int J Softw Eng Appl 11(3):71\u201386. https:\/\/doi.org\/10.5121\/ijsea.2020.11305","DOI":"10.5121\/ijsea.2020.11305"},{"key":"6824_CR17","doi-asserted-by":"publisher","DOI":"10.1002\/spe.3009","author":"Y Mahmood","year":"2021","unstructured":"Mahmood Y, Kama N, Azmi A, Khan AS, Ali M (2021) Software effort estimation accuracy prediction of machine learning techniques: A systematic performance evaluation. Softw - Practice and Exp. https:\/\/doi.org\/10.1002\/spe.3009","journal-title":"Softw - Practice and Exp"},{"key":"6824_CR18","doi-asserted-by":"publisher","unstructured":"Valerdi R (2011) 10.4.2 Convergence of Expert Opinion via the Wideband Delphi Method: An Application in Cost Estimation Models. INCOSE Int Symp, 21(1):1246\u20131259. https:\/\/doi.org\/10.1002\/j.2334-5837.2011.tb01282.x.","DOI":"10.1002\/j.2334-5837.2011.tb01282.x."},{"key":"6824_CR19","doi-asserted-by":"crossref","unstructured":"Ethayarajh K (2019) How contextual are contextualized word representations? Comparing the geometry of BERT, ELMo, and GPT-2 embeddings. arXiv:1909.00512","DOI":"10.18653\/v1\/D19-1006"},{"issue":"4","key":"6824_CR20","doi-asserted-by":"publisher","first-page":"573","DOI":"10.1109\/32.799958","volume":"25","author":"S Chulani","year":"1999","unstructured":"Chulani S, Boehm B, Steece B (1999) Bayesian analysis of empirical software engineering cost models. IEEE Trans Softw Eng 25(4):573\u2013583. https:\/\/doi.org\/10.1109\/32.799958","journal-title":"IEEE Trans Softw Eng"},{"key":"6824_CR21","doi-asserted-by":"publisher","unstructured":"Moreno A (2006) Review of \u2019Agile Estimating and Planning by Mike Cohn\u2019. Prentice Hall PTR, 2005, \\$44.99, ISBN: 0131479415. Queue, 4(5):59. https:\/\/doi.org\/10.1145\/1142031.1142049.","DOI":"10.1145\/1142031.1142049."},{"issue":"6","key":"6824_CR22","doi-asserted-by":"publisher","first-page":"872","DOI":"10.1109\/tse.2011.54","volume":"37","author":"G Concas","year":"2011","unstructured":"Concas G, Marchesi M, Murgia A, Tonelli R, Turnu I (2011) On the Distribution of Bugs in the Eclipse System. IEEE Trans Softw Eng 37(6):872\u2013877. https:\/\/doi.org\/10.1109\/tse.2011.54","journal-title":"IEEE Trans Softw Eng"},{"issue":"1","key":"6824_CR23","first-page":"2","volume":"5","author":"M Bloch","year":"2012","unstructured":"Bloch M, Blumberg S, Laartz J (2012) Delivering large-scale IT projects on time, on budget, and on value. Harvard Business Rev 5(1):2\u20137","journal-title":"Harvard Business Rev"},{"key":"6824_CR24","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1016\/j.knosys.2014.12.030","volume":"80","author":"W Pedrycz","year":"2015","unstructured":"Pedrycz W, Succi G, Sillitti A, Iljazi J (2015) Data description: A general framework of information granules. Knowl-Based Syst 80:98\u2013108. https:\/\/doi.org\/10.1016\/j.knosys.2014.12.030","journal-title":"Knowl-Based Syst"},{"issue":"7","key":"6824_CR25","doi-asserted-by":"publisher","first-page":"933","DOI":"10.1016\/j.ress.2007.03.009","volume":"93","author":"M Neil","year":"2008","unstructured":"Neil M, Tailor M, Marquez D, Fenton N, Hearty P (2008) Modelling dependable systems using hybrid Bayesian networks. Reliab Eng Syst Safety 93(7):933\u2013939. https:\/\/doi.org\/10.1016\/j.ress.2007.03.009","journal-title":"Reliab Eng Syst Safety"},{"issue":"11","key":"6824_CR26","doi-asserted-by":"publisher","first-page":"27625","DOI":"10.3390\/s151127625","volume":"15","author":"L Silva","year":"2015","unstructured":"Silva L, Almeida H, Perkusich A, Perkusich M (2015) A Model-Based Approach to Support Validation of Medical Cyber-Physical Systems. Sensors 15(11):27625\u201327670. https:\/\/doi.org\/10.3390\/s151127625","journal-title":"Sensors"},{"issue":"3","key":"6824_CR27","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1145\/3468744.3468751","volume":"46","author":"M Pinzger","year":"2021","unstructured":"Pinzger M, Giger E, Gall HC (2021) Comparing fine-grained source code changes and code churn for bug prediction - A retrospective. ACM SIGSOFT Softw Eng Notes 46(3):21\u201323. https:\/\/doi.org\/10.1145\/3468744.3468751","journal-title":"ACM SIGSOFT Softw Eng Notes"},{"key":"6824_CR28","doi-asserted-by":"publisher","DOI":"10.2139\/ssrn.3813246","author":"M Fackler","year":"2021","unstructured":"Fackler M (2021) Panjer class revisited: one formula for the distributions of the Panjer (a, b, n) class. SSRN Electron J. https:\/\/doi.org\/10.2139\/ssrn.3813246","journal-title":"SSRN Electron J"},{"issue":"10","key":"6824_CR29","doi-asserted-by":"publisher","first-page":"2275","DOI":"10.1016\/j.jss.2012.04.053","volume":"85","author":"P Bhattacharya","year":"2012","unstructured":"Bhattacharya P, Neamtiu I, Shelton CR (2012) Automated, highly-accurate, bug assignment using machine learning and tossing graphs. J Syst Softw 85(10):2275\u20132292. https:\/\/doi.org\/10.1016\/j.jss.2012.04.053","journal-title":"J Syst Softw"},{"issue":"4","key":"6824_CR30","doi-asserted-by":"publisher","first-page":"531","DOI":"10.1007\/s10515-012-0111-x","volume":"19","author":"P Hooimeijer","year":"2012","unstructured":"Hooimeijer P, Weimer W (2012) StrSolve: solving string constraints lazily. Automat Softw Eng 19(4):531\u2013559. https:\/\/doi.org\/10.1007\/s10515-012-0111-x","journal-title":"Automat Softw Eng"},{"issue":"6","key":"6824_CR31","doi-asserted-by":"publisher","first-page":"551","DOI":"10.1109\/tse.2017.2693989","volume":"44","author":"M Choetkiertikul","year":"2018","unstructured":"Choetkiertikul M, Dam HK, Tran T, Ghose A, Grundy J (2018) Predicting Delivery Capability in Iterative Software Development. IEEE Trans Softw Eng 44(6):551\u2013573. https:\/\/doi.org\/10.1109\/tse.2017.2693989","journal-title":"IEEE Trans Softw Eng"},{"key":"6824_CR32","doi-asserted-by":"publisher","unstructured":"Linares-V\u00e1squez M, Vendome C, Tufano M, Poshyvanyk D (2017) How developers micro-optimize Android apps. J Syst Softw, 130, pp 1\u201323.https:\/\/doi.org\/10.1016\/j.jss.2017.04.018","DOI":"10.1016\/j.jss.2017.04.018"},{"key":"6824_CR33","unstructured":"Dam HK, Tran T, Pham T (2016) A deep language model for software code. arXiv:1608.02715 [cs, stat]. [Accessed 5 Jan. 2023]"},{"key":"6824_CR34","doi-asserted-by":"publisher","unstructured":"Gu X, Zhang H, Zhang D, Kim S (2016) Deep API learning. In: Proc 24th ACM SIGSOFT Int Symp Found Softw Eng, pp 631\u2013642. https:\/\/doi.org\/10.1145\/2950290.2950334","DOI":"10.1145\/2950290.2950334"},{"key":"6824_CR35","doi-asserted-by":"publisher","unstructured":"Gupta R, Pal S, Kanade A, Shevade S (2017) DeepFix: Fixing Common C Language Errors by Deep Learning. Proceed AAAI Conf Artif Intell, 31(1). https:\/\/doi.org\/10.1609\/aaai.v31i1.10742","DOI":"10.1609\/aaai.v31i1.10742"},{"key":"6824_CR36","doi-asserted-by":"publisher","unstructured":"Hinton GE (2006) Reducing the Dimensionality of Data with Neural Networks. Science, [online] 313(5786), pp 504\u2013507. https:\/\/doi.org\/10.1126\/science.1127647","DOI":"10.1126\/science.1127647"},{"issue":"7","key":"6824_CR37","doi-asserted-by":"publisher","first-page":"637","DOI":"10.1109\/TSE.2018.2792473","volume":"45","author":"M Choetkiertikul","year":"2019","unstructured":"Choetkiertikul M, Dam HK, Tran T, Pham T, Ghose A, Menzies T (2019) A deep learning model for estimating story points. IEEE Trans Softw Eng 45(7):637\u2013656","journal-title":"IEEE Trans Softw Eng"},{"issue":"2","key":"6824_CR38","doi-asserted-by":"publisher","first-page":"425","DOI":"10.1109\/TSE.2011.27","volume":"38","author":"E Kocaguneli","year":"2012","unstructured":"Kocaguneli E, Menzies T, Bener A, Keung JW (2012) Exploiting the essential assumptions of analogy-based effort estimation. IEEE Trans Softw Eng 38(2):425\u2013438","journal-title":"IEEE Trans Softw Eng"},{"issue":"3","key":"6824_CR39","doi-asserted-by":"publisher","first-page":"813","DOI":"10.1007\/s10664-014-9300-5","volume":"20","author":"E Kocaguneli","year":"2015","unstructured":"Kocaguneli E, Menzies T, Mendes E (2015) Transfer learning in effort estimation. Empir Softw Eng 20(3):813\u2013843","journal-title":"Empir Softw Eng"},{"issue":"2","key":"6824_CR40","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1016\/j.jss.2008.06.001","volume":"82","author":"Y-F Li","year":"2009","unstructured":"Li Y-F, Xie M, Goh TN (2009) A study of project selection and feature weighting for analogy-based software cost estimation. J Syst Softw 82(2):241\u2013252","journal-title":"J Syst Softw"},{"key":"6824_CR41","doi-asserted-by":"crossref","unstructured":"Ding Y, Ray B, Devanbu P, Hellendoorn V J (2020) \u201cPatching as translation: The data and the metaphor,\u201d In: Proc 35th IEEE\/ACM Int Conf Automated Softw Eng, pp 275\u2013286","DOI":"10.1145\/3324884.3416587"},{"key":"6824_CR42","doi-asserted-by":"crossref","unstructured":"Jiang N, Lutellier T, Tan L (2021) \u201cCURE: Code-aware neural machine translation for automatic program repair,\u201d In: Proc Int Conf Softw Eng, pp 1161\u20131173","DOI":"10.1109\/ICSE43902.2021.00107"},{"key":"6824_CR43","doi-asserted-by":"crossref","unstructured":"Karampatsis R-M, Babii H, Robbes R, Sutton C, Janes A (2020) \u201cBig code != Big vocabulary: Open-vocabulary models for source code,\u201d In: Proc. IEEE\/ACM 42nd Int Conf Softw Eng, pp 1073\u20131085","DOI":"10.1145\/3377811.3380342"},{"key":"6824_CR44","doi-asserted-by":"crossref","unstructured":"Porru A, Murgia S, Demeyer M, Marchesi R, Tonelli (2016)\u201cEstimating story points from issue reports,\u201d In: Proc 12th Int Conf Predictive Models Data Anal Softw Eng, pp 1\u201310","DOI":"10.1145\/2972958.2972959"},{"key":"6824_CR45","unstructured":"[Online] GitHub Repository: https:\/\/github.com\/jai2shukla\/JIRA-Estimation-Prediction\/blob\/master\/README.md"},{"key":"6824_CR46","unstructured":"TAWOS GitHub Repository: https:\/\/github.com\/SOLAR-group\/TAWOS"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-025-06824-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-025-06824-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-025-06824-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T15:43:04Z","timestamp":1762530184000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-025-06824-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10]]},"references-count":46,"journal-issue":{"issue":"15","published-print":{"date-parts":[[2025,10]]}},"alternative-id":["6824"],"URL":"https:\/\/doi.org\/10.1007\/s10489-025-06824-4","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10]]},"assertion":[{"value":"31 July 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 October 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper\u2019s interest. We certify that the submission is original work and is not under review at any other publication.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}},{"value":"This study does not contain any studies with human or animal subjects performed by any of the authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical and Informed Consent for Data Used"}}],"article-number":"994"}}