{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,25]],"date-time":"2026-04-25T17:27:41Z","timestamp":1777138061810,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":61,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,8,18]],"date-time":"2021-08-18T00:00:00Z","timestamp":1629244800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Swiss National Science Foundation","award":["200021_197227"],"award-info":[{"award-number":["200021_197227"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,8,20]]},"DOI":"10.1145\/3468264.3468606","type":"proceedings-article","created":{"date-parts":[[2021,8,19]],"date-time":"2021-08-19T01:40:03Z","timestamp":1629337203000},"page":"932-944","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":38,"title":["Authorship attribution of source code: a language-agnostic approach and applicability in software engineering"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3499-2402","authenticated-orcid":false,"given":"Egor","family":"Bogomolov","sequence":"first","affiliation":[{"name":"JetBrains Research, Russia \/ HSE University, Russia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5880-7323","authenticated-orcid":false,"given":"Vladimir","family":"Kovalenko","sequence":"additional","affiliation":[{"name":"JetBrains Research, Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yurii","family":"Rebryk","sequence":"additional","affiliation":[{"name":"HSE University, Russia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0193-6823","authenticated-orcid":false,"given":"Alberto","family":"Bacchelli","sequence":"additional","affiliation":[{"name":"University of Zurich, Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9022-3563","authenticated-orcid":false,"given":"Timofey","family":"Bryksin","sequence":"additional","affiliation":[{"name":"JetBrains Research, Russia \/ HSE University, Russia"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2021,8,18]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2018. The State of the Octoverse. https:\/\/octoverse.github.com\/  2018. The State of the Octoverse. https:\/\/octoverse.github.com\/"},{"key":"e_1_3_2_1_2_1","unstructured":"2020. Google Style Guides. http:\/\/google.github.io\/styleguide\/  2020. Google Style Guides. http:\/\/google.github.io\/styleguide\/"},{"key":"e_1_3_2_1_3_1","unstructured":"2020. Gradle. https:\/\/github.com\/gradle\/gradle  2020. Gradle. https:\/\/github.com\/gradle\/gradle"},{"key":"e_1_3_2_1_4_1","unstructured":"2020. IntelliJ Community. https:\/\/github.com\/jetbrains\/intellij-community  2020. IntelliJ Community. https:\/\/github.com\/jetbrains\/intellij-community"},{"key":"e_1_3_2_1_5_1","unstructured":"2020. JetBrains Research GitHub: Authorship Detection. https:\/\/github.com\/JetBrains-Research\/authorship-detection  2020. JetBrains Research GitHub: Authorship Detection. https:\/\/github.com\/JetBrains-Research\/authorship-detection"},{"key":"e_1_3_2_1_6_1","unstructured":"2020. ML in Programming GitHub: PSO Authorship Detection. https:\/\/github.com\/ml-in-programming\/ml-on-source-code-models\/tree\/master\/psob_authorship  2020. ML in Programming GitHub: PSO Authorship Detection. https:\/\/github.com\/ml-in-programming\/ml-on-source-code-models\/tree\/master\/psob_authorship"},{"key":"e_1_3_2_1_7_1","unstructured":"2020. Mule. https:\/\/github.com\/mulesoft\/mule  2020. Mule. https:\/\/github.com\/mulesoft\/mule"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/2635868.2635883"},{"key":"e_1_3_2_1_9_1","volume-title":"code2seq: Generating Sequences from Structured Representations of Code. CoRR, abs\/1808.01400","author":"Alon Uri","year":"2018","unstructured":"Uri Alon , Omer Levy , and Eran Yahav . 2018. code2seq: Generating Sequences from Structured Representations of Code. CoRR, abs\/1808.01400 ( 2018 ), arxiv:1808.01400. arxiv:1808.01400 Uri Alon, Omer Levy, and Eran Yahav. 2018. code2seq: Generating Sequences from Structured Representations of Code. CoRR, abs\/1808.01400 (2018), arxiv:1808.01400. arxiv:1808.01400"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3296979.3192412"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/3290353"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"crossref","unstructured":"B. Alsulami E. Dauber R. Harang S. Mancoridis and R. Greenstadt. 2017. Source Code Authorship Attribution Using Long Short-Term Memory Based Networks. In Computer Security \u2013 ESORICS 2017 S. N. Foley D. Gollmann and E. Snekkenes (Eds.). Springer International Publishing Cham. 65\u201382. isbn:978-3-319-66402-6  B. Alsulami E. Dauber R. Harang S. Mancoridis and R. Greenstadt. 2017. Source Code Authorship Attribution Using Long Short-Term Memory Based Networks. In Computer Security \u2013 ESORICS 2017 S. N. Foley D. Gollmann and E. Snekkenes (Eds.). Springer International Publishing Cham. 65\u201382. isbn:978-3-319-66402-6","DOI":"10.1007\/978-3-319-66402-6_6"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/1134285.1134336"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-018-9650-5"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/1137983.1138016"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2025113.2025119"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSR.2009.5069475"},{"key":"e_1_3_2_1_18_1","volume-title":"ADCS 2007 - Proceedings of the Twelfth Australasian Document Computing Symposium, Jan..","author":"Burrows S.","year":"2007","unstructured":"S. Burrows and S.M.M. Tahaghoghi . 2007 . Source code authorship attribution using n-grams . ADCS 2007 - Proceedings of the Twelfth Australasian Document Computing Symposium, Jan.. S. Burrows and S.M.M. Tahaghoghi. 2007. Source code authorship attribution using n-grams. ADCS 2007 - Proceedings of the Twelfth Australasian Document Computing Symposium, Jan.."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1002\/spe.2146"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/COMPSAC.2009.85"},{"key":"e_1_3_2_1_21_1","volume-title":"24th USENIX Security Symposium (USENIX Security 15)","author":"Caliskan-Islam A.","year":"1971","unstructured":"A. Caliskan-Islam , R. Harang , A. Liu , A. Narayanan , C. Voss , F. Yamaguchi , and R. Greenstadt . 2015. De-anonymizing Programmers via Code Stylometry . In 24th USENIX Security Symposium (USENIX Security 15) . USENIX Association, Washington, D.C.. 255\u2013270. isbn:978-1-93 1971 -232 https:\/\/www.usenix.org\/conference\/usenixsecurity15\/technical-sessions\/presentation\/caliskan-islam A. Caliskan-Islam, R. Harang, A. Liu, A. Narayanan, C. Voss, F. Yamaguchi, and R. Greenstadt. 2015. De-anonymizing Programmers via Code Stylometry. In 24th USENIX Security Symposium (USENIX Security 15). USENIX Association, Washington, D.C.. 255\u2013270. isbn:978-1-931971-232 https:\/\/www.usenix.org\/conference\/usenixsecurity15\/technical-sessions\/presentation\/caliskan-islam"},{"key":"e_1_3_2_1_22_1","volume-title":"Thomas","author":"Cover Thomas M.","year":"1991","unstructured":"Thomas M. Cover and Joy A . Thomas . 1991 . Elements of Information Theory. Wiley-Interscience , USA. isbn:0471062596 Thomas M. Cover and Joy A. Thomas. 1991. Elements of Information Theory. Wiley-Interscience, USA. isbn:0471062596"},{"key":"e_1_3_2_1_23_1","first-page":"50","article-title":"Detecting Outsourced Student Programming Assignments","volume":"23","author":"Elenbogen B. S.","year":"2008","unstructured":"B. S. Elenbogen and N. Seliya . 2008 . Detecting Outsourced Student Programming Assignments . J. Comput. Sci. Coll. , 23 , 3 (2008), Jan. , 50 \u2013 57 . issn:1937-4771 http:\/\/dl.acm.org\/citation.cfm?id=1295109.1295123 B. S. Elenbogen and N. Seliya. 2008. Detecting Outsourced Student Programming Assignments. J. Comput. Sci. Coll., 23, 3 (2008), Jan., 50\u201357. issn:1937-4771 http:\/\/dl.acm.org\/citation.cfm?id=1295109.1295123","journal-title":"J. Comput. Sci. Coll."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/2642937.2642982"},{"key":"e_1_3_2_1_25_1","volume-title":"Identifying Authorship by Byte-Level N-Grams: The Source Code Author Profile (SCAP) Method.. IJDE, 6","author":"Frantzeskou G.","year":"2007","unstructured":"G. Frantzeskou , E. Stamatatos , S. Gritzalis , C. Chaski , and Blake Stephen H.. 2007. Identifying Authorship by Byte-Level N-Grams: The Source Code Author Profile (SCAP) Method.. IJDE, 6 ( 2007 ), Jan.. G. Frantzeskou, E. Stamatatos, S. Gritzalis, C. Chaski, and Blake Stephen H.. 2007. Identifying Authorship by Byte-Level N-Grams: The Source Code Author Profile (SCAP) Method.. IJDE, 6 (2007), Jan.."},{"key":"e_1_3_2_1_26_1","unstructured":"G. Frantzeskou E. Stamatatos S. Gritzalis and S. Katsikas. 2006. Source Code Author Identification Based on N-gram Author Profiles. In Artificial Intelligence Applications and Innovations I. Maglogiannis K. Karpouzis and M. Bramer (Eds.). Springer US Boston MA. 508\u2013515. isbn:978-0-387-34224-5  G. Frantzeskou E. Stamatatos S. Gritzalis and S. Katsikas. 2006. Source Code Author Identification Based on N-gram Author Profiles. In Artificial Intelligence Applications and Innovations I. Maglogiannis K. Karpouzis and M. Bramer (Eds.). Springer US Boston MA. 508\u2013515. isbn:978-0-387-34224-5"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/1806799.1806856"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/IWPSE.2005.21"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3379597.3387455"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3292577"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE.2015.74"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/2597073.2597074"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICNN.1995.488968"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/ITNG.2007.17"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICSM.2012.6405329"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-4048(97)00005-9"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/1276958.1277364"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/ecrime.2010.5706698"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/1150402.1150522"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/3133908"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"crossref","unstructured":"Peter S. Menell. 2017. API Copyrightability Bleak House: Unraveling and Repairing the Oracle v. Google Jurisdictional Mess. Berkeley Technology Law Journal 30 April.  Peter S. Menell. 2017. API Copyrightability Bleak House: Unraveling and Repairing the Oracle v. Google Jurisdictional Mess. Berkeley Technology Law Journal 30 April.","DOI":"10.2139\/ssrn.2859740"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2018.2871083"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/2950290.2983962"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/75427.75469"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/382222.382462"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.5555\/1953048.2078195"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSR.2019.00078"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/1985793.1985860"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/1082983.1083162"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/2001420.2001433"},{"key":"e_1_3_2_1_51_1","volume-title":"Proceedings of the 16th European Conference on Research in Computer Security (ESORICS\u201911)","author":"Rosenblum N.","year":"2041","unstructured":"N. Rosenblum , X. Zhu , and B. P. Miller . 2011. Who Wrote This Code? Identifying the Authors of Program Binaries . In Proceedings of the 16th European Conference on Research in Computer Security (ESORICS\u201911) . Springer-Verlag, Berlin, Heidelberg. 172\u2013189. isbn:978-3-642-23821-5 http:\/\/dl.acm.org\/citation.cfm?id= 2041 225.2041239 N. Rosenblum, X. Zhu, and B. P. Miller. 2011. Who Wrote This Code? Identifying the Authors of Program Binaries. In Proceedings of the 16th European Conference on Research in Computer Security (ESORICS\u201911). Springer-Verlag, Berlin, Heidelberg. 172\u2013189. isbn:978-3-642-23821-5 http:\/\/dl.acm.org\/citation.cfm?id=2041225.2041239"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1948.tb01338.x"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1109\/SSBSE.2009.18"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1515\/popets-2018-0007"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-010-9115-y"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/2884781.2884852"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.2307\/3001968"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-018-9634-5"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0187204"},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","DOI":"10.1145\/2025113.2025121"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"crossref","unstructured":"C. Zhang S. Wang J. Wu and Z. Niu. 2017. Authorship Identification of Source Codes. In APWeb\/WAIM.  C. Zhang S. Wang J. Wu and Z. Niu. 2017. Authorship Identification of Source Codes. In APWeb\/WAIM.","DOI":"10.1007\/978-3-319-63579-8_22"}],"event":{"name":"ESEC\/FSE '21: 29th ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering","location":"Athens Greece","acronym":"ESEC\/FSE '21","sponsor":["SIGSOFT ACM Special Interest Group on Software Engineering"]},"container-title":["Proceedings of the 29th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3468264.3468606","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3468264.3468606","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T21:24:51Z","timestamp":1750195491000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3468264.3468606"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,8,18]]},"references-count":61,"alternative-id":["10.1145\/3468264.3468606","10.1145\/3468264"],"URL":"https:\/\/doi.org\/10.1145\/3468264.3468606","relation":{},"subject":[],"published":{"date-parts":[[2021,8,18]]},"assertion":[{"value":"2021-08-18","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}