{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T03:21:07Z","timestamp":1740108067335,"version":"3.37.3"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2024,11,20]],"date-time":"2024-11-20T00:00:00Z","timestamp":1732060800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,20]],"date-time":"2024-11-20T00:00:00Z","timestamp":1732060800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Comput &amp; Applic"],"published-print":{"date-parts":[[2025,2]]},"DOI":"10.1007\/s00521-024-10535-1","type":"journal-article","created":{"date-parts":[[2024,11,20]],"date-time":"2024-11-20T09:27:16Z","timestamp":1732094836000},"page":"1771-1782","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["TinyBERT for branch prediction in modern microprocessors"],"prefix":"10.1007","volume":"37","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4795-5915","authenticated-orcid":false,"given":"Anwar","family":"Alajmi","sequence":"first","affiliation":[]},{"given":"Bashair","family":"AlSarraf","sequence":"additional","affiliation":[]},{"given":"Zainab","family":"Abualhassan","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6859-4621","authenticated-orcid":false,"given":"Abbas A.","family":"Fairouz","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0673-7324","authenticated-orcid":false,"given":"Imtiaz","family":"Ahmad","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,20]]},"reference":[{"key":"10535_CR1","unstructured":"Sambo MK (2023) A comparative study of pipelining, branch prediction, and superscalar architectures for enhanced computer performance. Computer Science"},{"issue":"2","key":"10535_CR2","doi-asserted-by":"crossref","first-page":"276","DOI":"10.1145\/225830.224438","volume":"23","author":"C Young","year":"1995","unstructured":"Young C, Gloy N, Smith MD (1995) A comparative analysis of schemes for correlated branch prediction. ACM SIGARCH Computer Arch News 23(2):276\u2013286","journal-title":"ACM SIGARCH Computer Arch News"},{"key":"10535_CR3","doi-asserted-by":"crossref","unstructured":"Lin C-K, Tarsa SJ (2019) Branch prediction is not a solved problem: Measurements, opportunities, and future directions. arXiv preprint","DOI":"10.1109\/IISWC47752.2019.9042108"},{"key":"10535_CR4","unstructured":"Sbera M, Vintan LN, Florea A (2001) Static and dynamic branch prediction using neural networks. Computer Science"},{"issue":"7","key":"10535_CR5","doi-asserted-by":"crossref","first-page":"3235","DOI":"10.3390\/app11073235","volume":"11","author":"H Choi","year":"2021","unstructured":"Choi H, Park S (2021) A survey of machine learning-based system performance optimization techniques. Appl Sci 11(7):3235","journal-title":"Appl Sci"},{"issue":"1\u20132","key":"10535_CR6","first-page":"102","volume":"23","author":"JW Fu","year":"1992","unstructured":"Fu JW, Patel JH, Janssens BL (1992) Stride directed prefetching in scalar processors. ACM SIGMICRO Newsletter 23(1\u20132):102\u2013110","journal-title":"ACM SIGMICRO Newsletter"},{"issue":"7553","key":"10535_CR7","first-page":"436","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun Y, Bengio Y, Hinton G (2015) Deep learning. nature 521(7553):436\u2013444","journal-title":"Deep learning. nature"},{"key":"10535_CR8","unstructured":"Joseph R (2021) A survey of deep learning techniques for dynamic branch prediction. arXiv preprint arXiv:2112.14911"},{"key":"10535_CR9","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3379504","volume":"55","author":"N Wu","year":"2021","unstructured":"Wu N, Xie Y (2021) A survey of machine learning for computer architecture and systems. ACM Computing Surveys (CSUR) 55:1\u201339","journal-title":"ACM Computing Surveys (CSUR)"},{"key":"10535_CR10","doi-asserted-by":"crossref","first-page":"86230","DOI":"10.1109\/ACCESS.2020.2992643","volume":"8","author":"L Zhang","year":"2020","unstructured":"Zhang L, Wu N, Ge F, Zhou F, Yahya MR (2020) A dynamic branch predictor based on parallel structure of srnn. IEEE Access 8:86230\u201386237","journal-title":"IEEE Access"},{"issue":"1","key":"10535_CR11","doi-asserted-by":"crossref","first-page":"4666","DOI":"10.1002\/cpe.4666","volume":"31","author":"S Mittal","year":"2019","unstructured":"Mittal S (2019) A survey of techniques for dynamic branch prediction. Concurr Comput: Practice Exp 31(1):4666","journal-title":"Concurr Comput: Practice Exp"},{"key":"10535_CR12","volume-title":"Supervised by Prof","author":"Sburlan, A.-F.: Discovering predictive patterns: A study of contextual factors for next generation branch predictors. MEng Individual Project, Imperial College London, London","year":"2023","unstructured":"Sburlan, A.-F.: Discovering predictive patterns: A study of contextual factors for next generation branch predictors. MEng Individual Project, Imperial College London, London (2023) Supervised by Prof. Paul Kelly and Dr, Giuliano Casale"},{"key":"10535_CR13","doi-asserted-by":"crossref","unstructured":"Jim\u00e9nez DA, Lin C (2001) Dynamic branch prediction with perceptrons. In: Proceedings HPCA Seventh International Symposium on High-Performance Computer Architecture, pp. 197\u2013206. IEEE","DOI":"10.1109\/HPCA.2001.903263"},{"key":"10535_CR14","volume-title":"Combining branch predictors","author":"S McFarling","year":"1993","unstructured":"McFarling S (1993) Combining branch predictors. Technical report, Citeseer (June"},{"key":"10535_CR15","doi-asserted-by":"crossref","unstructured":"Tullsen DM, Eggers SJ, Levy HM (1995) Simultaneous multithreading: Maximizing on-chip parallelism. In: Proceedings of the 22nd Annual International Symposium on Computer Architecture, pp. 392\u2013403","DOI":"10.1145\/223982.224449"},{"key":"10535_CR16","doi-asserted-by":"crossref","unstructured":"Yeh T-Y, Patt YN (1991) Two-level adaptive training branch prediction. In: Proceedings of the 24th Annual International Symposium on Microarchitecture, pp. 51\u201361","DOI":"10.1145\/123465.123475"},{"key":"10535_CR17","first-page":"23","volume":"8","author":"A Seznec","year":"2006","unstructured":"Seznec A, Michaud P (2006) A case for (partially) tagged geometric history length branch prediction. J Ins-Level Parallelism 8:23","journal-title":"J Ins-Level Parallelism"},{"key":"10535_CR18","unstructured":"Seznec A (2014) Tage-sc-l branch predictors. In: JILP-Championship Branch Prediction"},{"issue":"6","key":"10535_CR19","doi-asserted-by":"crossref","first-page":"386","DOI":"10.1037\/h0042519","volume":"65","author":"F Rosenblatt","year":"1958","unstructured":"Rosenblatt F (1958) The perceptron: a probabilistic model for information storage and organization in the brain. Psychol Rev 65(6):386","journal-title":"Psychol Rev"},{"key":"10535_CR20","unstructured":"Lee C-C, Chen I-C, Mudge TN (1997) The bi-mode branch predictor. In: Proceedings of 30th Annual International Symposium on Microarchitecture, pp. 4\u201313. IEEE"},{"key":"10535_CR21","doi-asserted-by":"crossref","unstructured":"Akkary H, Srinivasan ST, Koltur R, Patil Y, Refaai W (2004) Perceptron-based branch confidence estimation. In: 10th International Symposium on High Performance Computer Architecture (HPCA\u201904), pp. 265\u2013265. IEEE","DOI":"10.1109\/HPCA.2004.10002"},{"key":"10535_CR22","doi-asserted-by":"publisher","unstructured":"Hida I, Ikebe M, Asai T, Motomura M (2016) A 2-clock-cycle na\u00efve bayes classifier for dynamic branch prediction in pipelined risc microprocessors. In: 2016 IEEE Asia Pacific Conference on Circuits and Systems (APCCAS), pp. 297\u2013300. https:\/\/doi.org\/10.1109\/APCCAS.2016.7803958","DOI":"10.1109\/APCCAS.2016.7803958"},{"key":"10535_CR23","unstructured":"Tarsa SJ, Lin C-K, Keskin G, Chinya G, Wang H (2019) Improving branch prediction by modeling global history with convolutional neural networks. arXiv preprint arXiv:1906.09889"},{"key":"10535_CR24","doi-asserted-by":"crossref","unstructured":"Ozturk C, Sendag R (2010) An analysis of hard to predict branches. IEEE International Symposium on Performance Analysis of Systems & Software (ISPASS), 213\u2013222","DOI":"10.1109\/ISPASS.2010.5452016"},{"key":"10535_CR25","doi-asserted-by":"crossref","unstructured":"Zangeneh S, Pruett S, Lym S, Patt YN (2020) Branchnet: A convolutional neural network to predict hard-to-predict branches. In: 2020 53rd Annual IEEE\/ACM International Symposium on Microarchitecture (MICRO), pp. 118\u2013130. IEEE","DOI":"10.1109\/MICRO50266.2020.00022"},{"key":"10535_CR26","unstructured":"Seznec A (2016) Exploring branch predictability limits with the mtage+ sc predictor. In: 5th JILP Workshop on Computer Architecture Competitions (JWAC-5): Championship Branch Prediction (CBP-5), p. 4"},{"key":"10535_CR27","unstructured":"Zangeneh S, Pruett S, Patt Y (2020) Branch prediction with multilayer neural networks: The value of specialization. In: Machine Learning for Computer Architecture and Systems. National Science Foundation. NSF-PAR ID: 10249272"},{"key":"10535_CR28","volume-title":"Exp deep neural net branch prediction","author":"Y Mao","year":"2017","unstructured":"Mao Y, Huiyang Z, Gui X (2017) Exp deep neural net branch prediction. NC University, ECE Department"},{"key":"10535_CR29","unstructured":"Zouzias A, Kalaitzidis K, Grot B (2021) Branch prediction as a reinforcement learning problem: Why, how and case studies. arXiv preprint arXiv:2106.13429"},{"key":"10535_CR30","doi-asserted-by":"crossref","DOI":"10.1016\/j.neucom.2023.126637","volume":"555","author":"LA Villon","year":"2023","unstructured":"Villon LA, Susskind Z, Bacellar AT, Miranda ID, Ara\u00fajo LS, Lima PM, Breternitz M Jr, John LK, Fran\u00e7a FM, Dutra DL (2023) A conditional branch predictor based on weightless neural networks. Neurocomputing 555:126637","journal-title":"Neurocomputing"},{"issue":"3","key":"10535_CR31","doi-asserted-by":"crossref","first-page":"120","DOI":"10.1108\/eb007637","volume":"4","author":"I Aleksander","year":"1984","unstructured":"Aleksander I, Thomas W, Bowden P (1984) Wisard\u00b7 a radical step forward in image recognition. Sens Rev 4(3):120\u2013124","journal-title":"Sens Rev"},{"key":"10535_CR32","unstructured":"Shkadarevich D (2020) Branch Prediction Dataset. https:\/\/www.kaggle.com\/datasets\/dmitryshkadarevich\/branch-prediction"},{"key":"10535_CR33","unstructured":"Devlin J, Chang M, Lee K, Toutanova K (2018) BERT: pre-training of deep bidirectional transformers for language understanding. CoRR abs\/1810.04805[SPACE]https:\/\/arxiv.org\/abs\/1810.04805 1810.04805"},{"key":"10535_CR34","unstructured":"Bahdanau D, Cho K, Bengio Y (2014) Neural machine translation by jointly learning to align and translate. arXiv preprint arXiv:1409.0473"},{"key":"10535_CR35","doi-asserted-by":"crossref","unstructured":"Bhargava P, Drozd A, Rogers A (2021) Generalization in NLI: Ways (Not) To Go Beyond Simple Heuristics","DOI":"10.18653\/v1\/2021.insights-1.18"},{"key":"10535_CR36","unstructured":"Turc I, Chang M, Lee K, Toutanova K (2019) Well-read students learn better: The impact of student initialization on knowledge distillation. CoRR abs\/1908.08962[SPACE]https:\/\/arxiv.org\/abs\/1908.089621908.08962"},{"key":"10535_CR37","unstructured":"Alajmi A. Anwaarma\/BP-balanced. datasets at hugging face. https:\/\/huggingface.co\/datasets\/Anwaarma\/BP-balanced"},{"key":"10535_CR38","unstructured":"Lundberg SM, Lee S-I (2017) A unified approach to interpreting model predictions. Advances in neural information processing systems 30"},{"key":"10535_CR39","doi-asserted-by":"crossref","unstructured":"Wang Y, Fan H, Li S, Liang T, Zhang W (2024) A modular branch predictor performance analysis framework for fast design space exploration. In: 2024 Design, Automation & Test in Europe Conference & Exhibition (DATE), pp. 1\u20136. IEEE","DOI":"10.23919\/DATE58400.2024.10546853"},{"key":"10535_CR40","doi-asserted-by":"crossref","unstructured":"Jamet AV, Vavouliotis G, Jim\u00e9nez DA, Alvarez L, Casas M (2024) A two level neural approach combining off-chip prediction with adaptive prefetch filtering. In: 2024 IEEE International Symposium on High-Performance Computer Architecture (HPCA), pp. 528\u2013542. IEEE","DOI":"10.1109\/HPCA57654.2024.00046"}],"container-title":["Neural Computing and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-024-10535-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00521-024-10535-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-024-10535-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,5]],"date-time":"2025-02-05T21:48:48Z","timestamp":1738792128000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00521-024-10535-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,20]]},"references-count":40,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2025,2]]}},"alternative-id":["10535"],"URL":"https:\/\/doi.org\/10.1007\/s00521-024-10535-1","relation":{},"ISSN":["0941-0643","1433-3058"],"issn-type":[{"type":"print","value":"0941-0643"},{"type":"electronic","value":"1433-3058"}],"subject":[],"published":{"date-parts":[[2024,11,20]]},"assertion":[{"value":"4 March 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 October 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 November 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}