{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,19]],"date-time":"2026-06-19T16:30:07Z","timestamp":1781886607053,"version":"3.54.5"},"reference-count":29,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,10,28]],"date-time":"2023-10-28T00:00:00Z","timestamp":1698451200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,10,28]],"date-time":"2023-10-28T00:00:00Z","timestamp":1698451200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"NSFC","doi-asserted-by":"publisher","award":["62222607"],"award-info":[{"award-number":["62222607"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,10,28]]},"DOI":"10.1109\/iccad57390.2023.10323973","type":"proceedings-article","created":{"date-parts":[[2023,11,30]],"date-time":"2023-11-30T18:58:45Z","timestamp":1701370725000},"page":"1-9","source":"Crossref","is-referenced-by-count":8,"title":["EasySO: Exploration-enhanced Reinforcement Learning for Logic Synthesis Sequence Optimization and a Comprehensive RL Environment"],"prefix":"10.1109","author":[{"given":"Jianyong","family":"Yuan","sequence":"first","affiliation":[{"name":"Shanghai Jiao Tong University,MoE Key Lab of AI,Department of CSE,Shanghai,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Peiyu","family":"Wang","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University,MoE Key Lab of AI,Department of CSE,Shanghai,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Junjie","family":"Ye","sequence":"additional","affiliation":[{"name":"Huawei Noah&#x0027;s ark Lab, Shenzhen &#x0026; Hong 
Kong,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mingxuan","family":"Yuan","sequence":"additional","affiliation":[{"name":"Huawei Noah&#x0027;s ark Lab, Shenzhen &#x0026; Hong Kong,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jianye","family":"Hao","sequence":"additional","affiliation":[{"name":"Huawei Noah&#x0027;s ark Lab, Shenzhen &#x0026; Hong Kong,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Junchi","family":"Yan","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University,MoE Key Lab of AI,Department of CSE,Shanghai,China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3045014"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.23919\/DATE54114.2022.9774632"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ASP-DAC47756.2020.9045559"},{"key":"ref4","first-page":"1","article-title":"Batch sequential black-box optimization with embedding alignment cells for logic synthesis","volume-title":"Proceedings of the 41st IEEE\/ACM International Conference on Computer-Aided Design","author":"Feng","year":"2022"},{"key":"ref5","volume-title":"Abc: A system for sequential synthesis and verification","author":"Synthesis"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3380446.3430622"},{"key":"ref7","article-title":"Rethinking reinforcement learning based logic synthesis","author":"Wang","year":"2022","journal-title":"arXiv preprint"},{"key":"ref8","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv preprint"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2019\/316"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICFPT56656.2022.9974330"},{"issue":"CONF","key":"ref11","article-title":"The epfl combinational benchmark 
suite","volume-title":"Proceedings of the 24th International Workshop on Logic & Synthesis (IWLS)","author":"Amaru","year":"2015"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3020078.3021735"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3268344"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3489517.3530460"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ASP-DAC52403.2022.9712578"},{"key":"ref16","article-title":"Galois: Boosting deep reinforcement learning via generalizable logic synthesis","author":"Cao","year":"2022","journal-title":"arXiv preprint"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ISQED.2019.8697679"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/dac18074.2021.9586206"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TCSII.2022.3168344"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/11527862_14"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10226"},{"key":"ref22","article-title":"Deep reinforcement learning in parameterized action space","author":"Hausknecht","year":"2015","journal-title":"arXiv preprint"},{"key":"ref23","article-title":"Parametrized deep q-networks learning: Reinforcement learning with discrete-continuous hybrid action space","author":"Xiong","year":"2018","journal-title":"arXiv preprint"},{"key":"ref24","article-title":"Multi-pass q-networks for deep reinforcement learning with parameterised action spaces","author":"Bester","year":"2019","journal-title":"arXiv preprint"},{"key":"ref25","article-title":"Playing atari with deep reinforcement learning","author":"Mnih","year":"2013","journal-title":"arXiv preprint"},{"key":"ref26","article-title":"Continuous control with deep reinforcement learning","author":"Lillicrap","year":"2015","journal-title":"arXiv preprint"},{"key":"ref27","article-title":"Hyar: Addressing discrete-continuous action reinforcement learning via hybrid action 
representation","author":"Li","year":"2021","journal-title":"arXiv preprint"},{"key":"ref28","article-title":"High-dimensional continuous control using generalized advantage estimation","author":"Schulman","year":"2015","journal-title":"arXiv preprint"},{"key":"ref29","article-title":"Pytorch: An imperative style, high-performance deep learning library","author":"Paszke","year":"2019","journal-title":"NeurIPS"}],"event":{"name":"2023 IEEE\/ACM International Conference on Computer Aided Design (ICCAD)","location":"San Francisco, CA, USA","start":{"date-parts":[[2023,10,28]]},"end":{"date-parts":[[2023,11,2]]}},"container-title":["2023 IEEE\/ACM International Conference on Computer Aided Design (ICCAD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10323590\/10323543\/10323973.pdf?arnumber=10323973","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T22:19:15Z","timestamp":1709417955000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10323973\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,28]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/iccad57390.2023.10323973","relation":{},"subject":[],"published":{"date-parts":[[2023,10,28]]}}}