{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T06:13:59Z","timestamp":1775628839099,"version":"3.50.1"},"reference-count":39,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,12,3]],"date-time":"2025-12-03T00:00:00Z","timestamp":1764720000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,12,3]],"date-time":"2025-12-03T00:00:00Z","timestamp":1764720000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,12,3]]},"DOI":"10.1109\/icmla66185.2025.00134","type":"proceedings-article","created":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T19:54:58Z","timestamp":1775591698000},"page":"899-904","source":"Crossref","is-referenced-by-count":0,"title":["A Reward-Driven Controller for Text Generation with Black-Box Language Models"],"prefix":"10.1109","author":[{"given":"Robert","family":"Morain","sequence":"first","affiliation":[{"name":"Brigham Young University,Department of Computer Science"}]},{"given":"Dan","family":"Ventura","sequence":"additional","affiliation":[{"name":"Brigham Young University,Department of Computer Science"}]}],"member":"263","reference":[{"key":"ref1","first-page":"1877","article-title":"Language models are few-shot learners","author":"Brown","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.5040\/9781501365072.09396"},{"key":"ref3","article-title":"Fine-tuning language models from human preferences","volume":"abs\/1909.08593","author":"Ziegler","year":"2019","journal-title":"CoRR"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.52202\/068431-2011"},{"key":"ref5","article-title":"DeepSeek-R1: Incentivizing reasoning capability in LLMs via reinforcement learning","year":"2025"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3617680"},{"key":"ref7","article-title":"CTRL: A conditional transformer language model for controllable generation","volume":"abs\/1909.05858","author":"Keskar","year":"2019","journal-title":"CoRR"},{"key":"ref8","article-title":"Plug and play language models: A simple approach to controlled text generation","volume-title":"Proceedings of the International Conference on Learning Representations","author":"Dathathri"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-emnlp.424"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-long.522"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.223"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acllong.353"},{"key":"ref13","article-title":"Controllable text generation with residual memory transformer","volume":"abs\/2309.16231","author":"Zhang","year":"2023","journal-title":"CoRR"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-acl.229"},{"key":"ref15","doi-asserted-by":"crossref","DOI":"10.2139\/ssrn.5165270","article-title":"Prompting science report 1: Prompt engineering is complicated and contingent","volume-title":"Tech. Rep.","author":"Meincke","year":"2025"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1002\/jocb.671"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.346"},{"key":"ref18","article-title":"Large language models as optimizers","volume-title":"Proceedings of the International Conference on Learning Representations","author":"Yang"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.naacl-main.403"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.222"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1339"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.findings-emnlp.301"},{"key":"ref23","article-title":"A neural probabilistic language model","volume":"13","author":"Bengio","year":"2000","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1707.06347"},{"key":"ref25","article-title":"TRL: Transformer reinforcement learning","author":"von Werra","year":"2020"},{"key":"ref26","article-title":"Adam: A method for stochastic optimization","volume":"abs\/1412.6980","author":"Kingma","year":"2017","journal-title":"CoRR"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D13-1170"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.5555\/2002472.2002491"},{"key":"ref29","article-title":"Openwebtext corpus","author":"Gokaslan","year":"2019"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-demos.6"},{"issue":"8","key":"ref31","first-page":"9","article-title":"Language models are unsupervised multitask learners","volume":"1","author":"Radford","year":"2019","journal-title":"OpenAI Blog"},{"key":"ref32","article-title":"DistilBERT, a distilled version of BERT: smaller, faster, cheaper and lighter","volume":"abs\/1910.01108","author":"Sanh","year":"2019","journal-title":"CoRR"},{"key":"ref33","article-title":"Introducing Llama 3.1: Our most capable models to date","year":"2024"},{"key":"ref34","article-title":"Detoxify","author":"Hanu","year":"2020"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1117"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1005"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00360"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA55696.2022.00166"},{"key":"ref39","article-title":"Multimodal paralinguistic prompting for large language models","author":"Yang","year":"2023"}],"event":{"name":"2025 International Conference on Machine Learning and Applications (ICMLA)","location":"Boca Raton, FL, USA","start":{"date-parts":[[2025,12,3]]},"end":{"date-parts":[[2025,12,5]]}},"container-title":["2025 International Conference on Machine Learning and Applications (ICMLA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11471302\/11471304\/11471444.pdf?arnumber=11471444","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T05:38:14Z","timestamp":1775626694000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11471444\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,3]]},"references-count":39,"URL":"https:\/\/doi.org\/10.1109\/icmla66185.2025.00134","relation":{},"subject":[],"published":{"date-parts":[[2025,12,3]]}}}