{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T01:05:49Z","timestamp":1740099949203,"version":"3.37.3"},"reference-count":42,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,12,7]],"date-time":"2020-12-07T00:00:00Z","timestamp":1607299200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,12,7]],"date-time":"2020-12-07T00:00:00Z","timestamp":1607299200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,12,7]],"date-time":"2020-12-07T00:00:00Z","timestamp":1607299200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100005735","name":"Tamkang University (TKU)","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100005735","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100007225","name":"Ministry of Science and Technology (MOST)","doi-asserted-by":"publisher","award":["109-2221-E-324-024"],"award-info":[{"award-number":["109-2221-E-324-024"]}],"id":[{"id":"10.13039\/100007225","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,12,7]]},"DOI":"10.1109\/asonam49781.2020.9381329","type":"proceedings-article","created":{"date-parts":[[2021,3,24]],"date-time":"2021-03-24T20:17:37Z","timestamp":1616617057000},"page":"919-925","source":"Crossref","is-referenced-by-count":0,"title":["Fine-tuning techniques and data augmentation on transformer-based models for conversational texts and noisy user-generated content"],"prefix":"10.1109","author":[{"given":"Mike Tian-Jian","family":"Jiang","sequence":"first","affiliation":[]},{"given":"Shih-Hung","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Yi-Kun","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Zhao-Xian","family":"Gu","sequence":"additional","affiliation":[]},{"given":"Cheng-Jhe","family":"Chiang","sequence":"additional","affiliation":[]},{"given":"Yueh-Chia","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Yu-Chen","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Cheng-Han","family":"Chiu","sequence":"additional","affiliation":[]},{"given":"Sheng-Ru","family":"Shaw","sequence":"additional","affiliation":[]},{"given":"Min-Yuh","family":"Day","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","article-title":"Overview of the NTCIR-15 Dialogue Evaluation (DialEval-1) Task","author":"zeng","year":"0","journal-title":"Proceedings of the 15th NTCIR Conference on Evaluation of Information Access Technologies"},{"key":"ref38","article-title":"Overview of the NTCIR-14 short text conversation task: Dialogue quality and nugget detection subtasks","author":"zeng","year":"0","journal-title":"Proceedings of the 14th NTCIR Conference on Evaluation of Information Access Technologies"},{"key":"ref33","article-title":"Google's Neural Machine Translation System: Bridging the Gap between Human and Machine Translation","volume":"abs 1609 8144","author":"wu","year":"2016","journal-title":"CoRR"},{"key":"ref32","article-title":"HuggingFace's Transformers: State-of-the-art Natural Language Processing","volume":"abs 1910 3771","author":"wolf","year":"2019","journal-title":"CoRR"},{"key":"ref31","first-page":"271","article-title":"PARADISE: A Framework for Evaluating Spoken Dialogue Agents","author":"walker","year":"1997","journal-title":"35th Annual Meeting of the Association for Computational Linguistics and 8th Conference of the European Chapter of the Association for Computational Linguistics"},{"journal-title":"A disciplined approach to neural network hyperparameters Part 1 - learning rate batch size momentum and weight decay","year":"2018","author":"smith","key":"ref30"},{"key":"ref37","article-title":"Large Batch Optimization for Deep Learning: Training BERT in 76 minutes","author":"you","year":"0","journal-title":"International Conference on Learning Representations"},{"journal-title":"Large batch training of convolutional networks","year":"2017","author":"you","key":"ref36"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_37"},{"key":"ref34","article-title":"WUST at the NTCIR-14 STC-3 Dialogue Quality and Nugget Detection Subtask","author":"yan","year":"0","journal-title":"Proceedings of the 14th NTCIR Conference on Evaluation of Information Access Technologies"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.3390\/info11020108"},{"key":"ref40","first-page":"9597","article-title":"Lookahead optimizer: k steps forward, 1 step back","author":"zhang","year":"0","journal-title":"Advances in neural information processing systems"},{"journal-title":"Deep learning for coders with fastai and PyTorch AI applications without a PhD","year":"2020","author":"howard","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1031"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-60290-1_21"},{"key":"ref14","article-title":"SLSTC at the NTCIR-14 STC-3 dialogue quality and nugget detection subtasks","author":"kato","year":"0","journal-title":"Proceedings of the 14th NTCIR Conference on Evaluation of Information Access Technologies"},{"journal-title":"CTRL A Conditional Transformer Language Model for Controllable Generation","year":"2019","author":"keskar","key":"ref15"},{"key":"ref16","article-title":"Adam: A Method for Stochastic Optimization","author":"kingma","year":"2015","journal-title":"3rd International Conference on Learning Representations ICLR 2015"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1007"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-2012"},{"key":"ref19","article-title":"Cross-lingual Language Model Pretraining","author":"lample","year":"0","journal-title":"Advances in Neural IInformation Processing Systems"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1162"},{"key":"ref4","article-title":"CUIS at the NTCIR-14 STC-3 DQ Subtask","author":"cong","year":"0","journal-title":"Proceedings of the 14th NTCIR Conference on Evaluation of Information Access Technologies"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W19-4302"},{"key":"ref3","article-title":"Dialogue quality and nugget detection for short text conversation (STC-3) based on hierarchical multi-stack model with memory enhance structure","author":"cherng","year":"0","journal-title":"Proceedings of the 14th NTCIR Conference on Evaluation of Information Access Technologies"},{"journal-title":"Pre-training with whole word masking for chinese bert","year":"2019","author":"cui","key":"ref6"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2017.58"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2005.06.042"},{"key":"ref7","first-page":"4171","article-title":"BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding","volume":"1","author":"devlin","year":"2019","journal-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics Human Language Technologies"},{"journal-title":"Language models are few-shot learners","year":"2020","author":"brown","key":"ref2"},{"key":"ref1","first-page":"622","article-title":"Assessing Dialog System User Simulation Evaluation Measures Using Human Judges","author":"ai","year":"2020","journal-title":"Proceedings of ACL-08 HLT Association for Computational Linguistics"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref20","article-title":"On the Variance of the Adaptive Learning Rate and Beyond","author":"liu","year":"0","journal-title":"International Conference on Learning Representations"},{"key":"ref22","article-title":"Regularizing and Optimizing LSTM Language Models","author":"merity","year":"0","journal-title":"International Conference on Learning Representations"},{"key":"ref21","article-title":"RoBERTa: A Robustly Optimized BERT Pretraining Approach","volume":"abs 1907 11692","author":"liu","year":"2019","journal-title":"CoRR"},{"key":"ref24","first-page":"4694","article-title":"When does label smoothing help?","author":"m\u00fcller","year":"0","journal-title":"Advances in neural information processing systems"},{"key":"ref42","article-title":"Overview of the NTCIR-15 FinNum-2 Task: Numeral Attachment in Financial Tweets","author":"chen","year":"0","journal-title":"Proceedings of the 15th NTCIR Conference on Evaluation of Information Access Technologies"},{"key":"ref23","article-title":"An Analysis of Neural Language Modeling at Multiple Scales","volume":"abs 1803 8240","author":"merity","year":"2018","journal-title":"CoRR"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-36805-0_14"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"ref25","first-page":"1116","article-title":"Towards an Automatic Turing Test: Learning to Evaluate Dialogue Responses","author":"michael","year":"2017","journal-title":"Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics (Volume 1 Long Papers)"}],"event":{"name":"2020 IEEE\/ACM International Conference on Advances in Social Networks Analysis and Mining (ASONAM)","start":{"date-parts":[[2020,12,7]]},"location":"The Hague, Netherlands","end":{"date-parts":[[2020,12,10]]}},"container-title":["2020 IEEE\/ACM International Conference on Advances in Social Networks Analysis and Mining (ASONAM)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9381192\/9381291\/09381329.pdf?arnumber=9381329","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T15:39:16Z","timestamp":1656344356000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9381329\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,12,7]]},"references-count":42,"URL":"https:\/\/doi.org\/10.1109\/asonam49781.2020.9381329","relation":{},"subject":[],"published":{"date-parts":[[2020,12,7]]}}}