{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T14:15:46Z","timestamp":1730297746695,"version":"3.28.0"},"reference-count":81,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,11,21]],"date-time":"2023-11-21T00:00:00Z","timestamp":1700524800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,11,21]],"date-time":"2023-11-21T00:00:00Z","timestamp":1700524800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,11,21]]},"DOI":"10.1109\/snams60348.2023.10375471","type":"proceedings-article","created":{"date-parts":[[2024,1,2]],"date-time":"2024-01-02T15:36:22Z","timestamp":1704209782000},"page":"1-9","source":"Crossref","is-referenced-by-count":2,"title":["The Batch Primary Components Transformer and Auto-Plasticity Learning Linear Units Architecture: Synthetic Image Generation Case"],"prefix":"10.1109","author":[{"given":"Stanislav","family":"Selitskiy","sequence":"first","affiliation":[{"name":"School Of Computer Science And Technology, University of Bedfordshire,Luton,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chihiro","family":"Inoue","sequence":"additional","affiliation":[{"name":"University of Bedfordshire,Centre For Research In English Language Learning And Assessment,Luton,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vitaly","family":"Schetinin","sequence":"additional","affiliation":[{"name":"School Of Computer Science And Technology, University of Bedfordshire,Luton,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Livija","family":"Jakaite","sequence":"additional","affiliation":[{"name":"School Of Computer Science And Technology, University of Bedfordshire,Luton,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"volume-title":"GPT-4","year":"2023","key":"ref1"},{"volume-title":"Pathways Language Model (PaLM): Scaling to 540 Billion Parameters for Breakthrough Performance","year":"2023","key":"ref2"},{"key":"ref3","article-title":"Palm: Scaling language modeling with pathways","author":"Chowdhery","year":"2022","journal-title":"arXiv preprint"},{"key":"ref4","article-title":"Llama: Open and efficient foundation language models","author":"Touvron","year":"2023","journal-title":"arXiv preprint"},{"key":"ref5","article-title":"Detecting llm-generated text in computing education: A comparative study for chatgpt cases","author":"Orenstrakh","year":"2023","journal-title":"arXiv preprint"},{"key":"ref6","article-title":"The science of detecting llm-generated texts","volume-title":"arXiv preprint","author":"Tang","year":"2023"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3587102.3588792"},{"key":"ref8","first-page":"2022","article-title":"Comparing scientific abstracts generated by chatgpt to original abstracts using an artificial intelligence output detector, plagiarism detector, and blinded human reviewers","volume-title":"BioRxiv","author":"Gao","year":"2022"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-94890-0_9"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.5465\/AMBPP.2022.17063abstract"},{"key":"ref11","article-title":"Chatgpt or human? detect and explain. explaining decisions of machine learning model for detecting short chatgpt-generated text","author":"Mitrovi\u0107","year":"2023","journal-title":"arXiv preprint"},{"key":"ref12","first-page":"515","article-title":"Can chatgpt detect student talk moves in classroom discourse? a preliminary comparison with bert","volume-title":"Proceedings of the 16th International Conference on Educational Data Mining","author":"Wang","year":"Jul 2023"},{"key":"ref13","article-title":"Is reinforcement learning (not) for natural language processing?: Benchmarks, baselines, and building blocks for natural language policy optimization","author":"Ramamurthy","year":"2022","journal-title":"arXiv preprint"},{"key":"ref14","article-title":"Grounding large language models in interactive environments with online reinforcement learning","author":"Carta","year":"2023","journal-title":"arXiv preprint"},{"key":"ref15","article-title":"On the uses of large language models to interpret ambiguous cyberattack descriptions","author":"Fayyazi","year":"2023","journal-title":"arXiv preprint"},{"key":"ref16","article-title":"Mathematical capabilities of chatgpt","author":"Frieder","year":"2023","journal-title":"arXiv preprint"},{"key":"ref17","article-title":"A categorical archive of chatgpt failures","author":"Borji","year":"2023","journal-title":"arXiv preprint"},{"key":"ref18","article-title":"ChatGPT is no stochastic parrot. But it also claims 1 > 1. | Medium","volume-title":"Medium","author":"Arkoudas","year":"2023"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W19-3805"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W19-3823"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1339"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.findings-emnlp.301"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.463"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1037\/rev0000297"},{"volume-title":"A very preliminary analysis of dall-e 2","year":"2022","author":"Marcus","key":"ref25"},{"key":"ref26","article-title":"Pitfalls of static language modelling","author":"Lazaridou","year":"2021","journal-title":"arXiv preprint"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467162"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00459"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/s0079-7421(08)60536-8"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1016\/S1364-6613(99)01294-2"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561165"},{"journal-title":"Generalized out-of-distribution detection: A survey","year":"2022","author":"Yang","key":"ref32"},{"key":"ref33","article-title":"Is learning the n-th thing any easier than learning the first?","volume":"8","author":"Thrun","year":"1995","journal-title":"Advances in neural information processing systems"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01252-6_33"},{"key":"ref35","article-title":"Continual backprop: Stochastic gradient descent with persistent randomness","author":"Dohare","year":"2021","journal-title":"arXiv preprint"},{"key":"ref36","first-page":"3884","article-title":"On warm-starting neural network training","volume":"33","author":"Ash","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref37","article-title":"A study on the plasticity of neural networks","author":"Berariu","year":"2021","journal-title":"arXiv preprint"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1037\/0033-295x.97.2.285"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1611835114"},{"key":"ref40","article-title":"Loss of plasticity in continual deep reinforcement learning","author":"Abbas","year":"2023","journal-title":"arXiv preprint"},{"key":"ref41","article-title":"Muril: Multilingual representations for indian languages","author":"Khanuja","year":"2021","journal-title":"arXiv preprint"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.121598"},{"key":"ref43","article-title":"How good is your tokenizer? on the monolingual performance of multilingual language models","author":"Rust","year":"2020","journal-title":"arXiv preprint"},{"key":"ref44","first-page":"94","article-title":"Reducing tokenizers tokens per word ratio in financial domain with t-mufin bert tokenizer","volume-title":"Proceedings of the Fifth Workshop on Financial Technology and Natural Language Processing and the Second Multimodal AI For Financial Forecasting","author":"Gopalakrishnan"},{"volume-title":"Practical text analytics: Interpreting text and unstructured data for business intelligence","year":"2015","author":"Struhl","key":"ref45"},{"key":"ref46","article-title":"Introduction to the bag of features paradigm for image classification and retrieval","author":"OHara","year":"2011","journal-title":"arXiv preprint"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1007\/s13042-010-0001-0"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1177\/107769905303000401"},{"key":"ref49","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018","journal-title":"arXiv preprint"},{"issue":"4","key":"ref50","first-page":"467","article-title":"Class-based n-gram models of natural language","volume":"18","author":"Brown","year":"1992","journal-title":"Computational linguistics"},{"key":"ref51","article-title":"Masked language model scoring","author":"Salazar","year":"2019","journal-title":"arXiv preprint"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.2307\/2987782"},{"key":"ref53","article-title":"Neural machine translation by jointly learning to align and translate","author":"Bahdanau","year":"2014","journal-title":"arXiv preprint"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D15-1166"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/p17-1012"},{"key":"ref56","article-title":"Attention is all you need","volume-title":"CoRR, vol. abs\/1706.03762","author":"Vaswani","year":"2017"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1145\/3442188.3445922"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.185"},{"key":"ref59","article-title":"Deep learning: A critical appraisal","volume-title":"CoRR","author":"Marcus","year":"2018"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1016\/j.tcs.2021.10.020"},{"key":"ref61","article-title":"Mathematical structure of syntactic merge","author":"Marcolli","year":"2023","journal-title":"arXiv preprint"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1163\/23526416-bja10040"},{"key":"ref63","first-page":"3","article-title":"Rethinking universality","author":"Watumull","year":"2020","journal-title":"Syntactic architecture and its consequences II"},{"key":"ref64","article-title":"Neural networks and the chomsky hierarchy","author":"Del\u00e9tang","year":"2022","journal-title":"arXiv preprint"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00324"},{"key":"ref66","article-title":"Lifelong learning with dynamically expandable networks","author":"Yoon","year":"2017","journal-title":"arXiv preprint"},{"key":"ref67","article-title":"Continual learning via neural pruning","author":"Golkar","year":"2019","journal-title":"arXiv preprint"},{"key":"ref68","article-title":"Random path selection for continual learning","volume":"32","author":"Rajasegaran","year":"2019","journal-title":"Advances in Neural Information Processing Systems"},{"journal-title":"Online continual learning with maximally interfered retrieval","year":"2019","author":"Aljundi","key":"ref69"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1515\/9781400881970-018"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i11.17159"},{"key":"ref72","article-title":"Learning to learn without forgetting by maximizing transfer and minimizing interference","author":"Riemer","year":"2018","journal-title":"arXiv preprint"},{"journal-title":"Loss of plasticity in deep continual learning","year":"2023","author":"Dohare","key":"ref73"},{"key":"ref74","first-page":"2217","article-title":"Understanding and improving convolutional neural networks via concatenated rectified linear units","volume-title":"international conference on machine learning","author":"Shang"},{"key":"ref75","article-title":"Radial basis functions, multi-variable functional interpolation and adaptive networks","author":"Broomhead","year":"1988","journal-title":"Royal Signals and Radar Establishment Malvern (United Kingdom), Tech. Rep."},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1090\/trans2\/017\/12"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1989.1.4.465"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1991.3.4.617"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1017\/S0962492900002919"},{"volume-title":"MNIST handwritten digit database, Yann LeCun, Corinna Cortes and Chris Burges","year":"2013","key":"ref80"},{"volume-title":"Load MNIST database in Matlab | Lulus blog","year":"2023","key":"ref81"}],"event":{"name":"2023 Tenth International Conference on Social Networks Analysis, Management and Security (SNAMS)","start":{"date-parts":[[2023,11,21]]},"location":"Abu Dhabi, United Arab Emirates","end":{"date-parts":[[2023,11,24]]}},"container-title":["2023 Tenth International Conference on Social Networks Analysis, Management and Security (SNAMS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10375374\/10375393\/10375471.pdf?arnumber=10375471","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,12]],"date-time":"2024-01-12T18:58:37Z","timestamp":1705085917000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10375471\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,21]]},"references-count":81,"URL":"https:\/\/doi.org\/10.1109\/snams60348.2023.10375471","relation":{},"subject":[],"published":{"date-parts":[[2023,11,21]]}}}