{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T15:03:25Z","timestamp":1743087805353,"version":"3.40.3"},"publisher-location":"Singapore","reference-count":29,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819755806"},{"type":"electronic","value":"9789819755813"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-981-97-5581-3_34","type":"book-chapter","created":{"date-parts":[[2024,8,1]],"date-time":"2024-08-01T19:02:53Z","timestamp":1722538973000},"page":"419-431","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Calibrating the Converted Spiking Reinforcement Learning"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-7528-897X","authenticated-orcid":false,"given":"Jian","family":"Song","sequence":"first","affiliation":[]},{"given":"Xiangfei","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Xuetao","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Donglin","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,8,1]]},"reference":[{"issue":"7784","key":"34_CR1","doi-asserted-by":"publisher","first-page":"607","DOI":"10.1038\/s41586-019-1677-2","volume":"575","author":"K 
Roy","year":"2019","unstructured":"Roy, K., Jaiswal, A., Panda, P.: Towards spike-based machine intelligence with neuromorphic computing. Nature 575(7784), 607\u2013617 (2019)","journal-title":"Nature"},{"issue":"8","key":"34_CR2","doi-asserted-by":"publisher","first-page":"5200","DOI":"10.1109\/TNNLS.2021.3119238","volume":"34","author":"Y Hu","year":"2021","unstructured":"Hu, Y., Tang, H., Pan, G.: Spiking deep residual networks. IEEE Trans. Neural Netw. Learn. Syst. 34(8), 5200\u20135205 (2021)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"34_CR3","first-page":"21056","volume":"34","author":"W Fang","year":"2021","unstructured":"Fang, W., Yu, Z., Chen, Y., et al.: Deep residual learning in spiking neural networks. Adv. Neural. Inf. Process. Syst. 34, 21056\u201321069 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"34_CR4","unstructured":"Lv, C., Li, T., Xu, J., et al.: SpikeBERT: a language spikformer trained with two-stage knowledge distillation from BERT. arXiv (2023)"},{"key":"34_CR5","doi-asserted-by":"crossref","unstructured":"Roy, D., Chakraborty, I., Roy, K.: Scaling deep spiking neural networks with binary stochastic activations. In: 2019 IEEE International Conference on Cognitive Computing (ICCC), pp. 50\u201358. IEEE (2019)","DOI":"10.1109\/ICCC.2019.00020"},{"key":"34_CR6","doi-asserted-by":"publisher","first-page":"294","DOI":"10.1016\/j.neunet.2019.09.005","volume":"121","author":"L Deng","year":"2020","unstructured":"Deng, L., Wu, Y., Hu, X., et al.: Rethinking the performance comparison between SNNs and ANNs. Neural Netw. 121, 294\u2013307 (2020)","journal-title":"Neural Netw."},{"key":"34_CR7","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1146\/annurev.neuro.31.060407.125639","volume":"31","author":"N Caporale","year":"2008","unstructured":"Caporale, N., Dan, Y.: Spike timing\u2013dependent plasticity: a Hebbian learning rule. Annu. Rev. Neurosci. 31, 25\u201346 (2008)","journal-title":"Annu. 
Rev. Neurosci."},{"issue":"6","key":"34_CR8","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1109\/MSP.2019.2931595","volume":"36","author":"EO Neftci","year":"2019","unstructured":"Neftci, E.O., Mostafa, H., Zenke, F.: Surrogate gradient learning in spiking neural networks: bringing the power of gradient-based optimization to spiking neural networks. IEEE Signal Process. Mag. 36(6), 51\u201363 (2019)","journal-title":"IEEE Signal Process. Mag."},{"key":"34_CR9","doi-asserted-by":"publisher","first-page":"54","DOI":"10.1007\/s11263-014-0788-3","volume":"113","author":"Y Cao","year":"2015","unstructured":"Cao, Y., Chen, Y., Khosla, D.: Spiking deep convolutional neural networks for energy-efficient object recognition. Int. J. Comput. Vision 113, 54\u201366 (2015)","journal-title":"Int. J. Comput. Vision"},{"key":"34_CR10","doi-asserted-by":"crossref","unstructured":"Wu, Y., Deng, L., Li, G., Zhu, J., Shi, L.: Spatio-temporal backpropagation for training high-performance spiking neural networks. Front. Neurosci. 12(331) (2018)","DOI":"10.3389\/fnins.2018.00331"},{"key":"34_CR11","unstructured":"Zhang, W., Li, P.: Temporal spike sequence learning via backpropagation for deep spiking neural networks. In: Advances in Neural Information Processing Systems, pp. 12022\u201312033 (2020)"},{"key":"34_CR12","doi-asserted-by":"crossref","unstructured":"Wu, Y., Deng, L., Li, G., Zhu, J., Xie, Y., Shi, L.: Direct training for spiking neural networks: faster, larger, better. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp. 1311\u20131318 (2019)","DOI":"10.1609\/aaai.v33i01.33011311"},{"key":"34_CR13","unstructured":"Hao, Z., Ding, J., Bu, T., Huang, T., Yu, Z.: Bridging the gap between ANNs and SNNs by calibrating offset spikes. arXiv (2023)"},{"key":"34_CR14","unstructured":"Fujimoto, S., Gu, S.S.: A minimalist approach to offline reinforcement learning. In: Advances in Neural Information Processing Systems, pp. 
20132\u201320145 (2021)"},{"key":"34_CR15","doi-asserted-by":"crossref","unstructured":"Todorov, E., Erez, T., Tassa, Y.: MuJoCo: a physics engine for model-based control. In: 2012 IEEE\/RSJ International Conference on Intelligent Robots and Systems, pp. 5026\u20135033. IEEE (2012)","DOI":"10.1109\/IROS.2012.6386109"},{"key":"34_CR16","doi-asserted-by":"crossref","unstructured":"Prudencio, R.F., Maximo, M.R.O.A., Colombini, E.L.: A survey on offline reinforcement learning: taxonomy, review, and open problems. IEEE Trans. Neural Netw. Learn. Syst. (2023)","DOI":"10.1109\/TNNLS.2023.3250269"},{"issue":"6","key":"34_CR17","doi-asserted-by":"publisher","first-page":"1063","DOI":"10.1016\/S0896-6273(03)00761-X","volume":"40","author":"H Seung","year":"2003","unstructured":"Seung, H.: Learning in spiking neural networks by reinforcement of stochastic synaptic transmission. Neuron 40(6), 1063\u20131073 (2003)","journal-title":"Neuron"},{"issue":"2","key":"34_CR18","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1162\/neco.2008.08-07-593","volume":"21","author":"W Potjans","year":"2009","unstructured":"Potjans, W., Morrison, A., Diesmann, M.: A spiking neural network model of an actor-critic learning agent. Neural Comput. 21(2), 301\u2013339 (2009)","journal-title":"Neural Comput."},{"issue":"6","key":"34_CR19","doi-asserted-by":"publisher","first-page":"1468","DOI":"10.1162\/neco.2007.19.6.1468","volume":"19","author":"RV Florian","year":"2007","unstructured":"Florian, R.V.: Reinforcement learning through modulation of spike-timing dependent synaptic plasticity. Neural Comput. 19(6), 1468\u20131502 (2007)","journal-title":"Neural Comput."},{"key":"34_CR20","doi-asserted-by":"crossref","unstructured":"Bing, Z., Meschede, C., Huang, K., Chen, G., et al.: End to end learning of spiking neural network based on R-STDP for a lane keeping vehicle. In: 2018 IEEE International Conference on Robotics and Automation (ICRA), pp. 4725\u20134732. 
IEEE (2018)","DOI":"10.1109\/ICRA.2018.8460482"},{"key":"34_CR21","doi-asserted-by":"publisher","first-page":"108","DOI":"10.1016\/j.neunet.2019.08.009","volume":"120","author":"D Patel","year":"2019","unstructured":"Patel, D., Hazan, H., Saunders, D.J., Siegelmann, H.T., Kozma, R.: Improved robustness of reinforcement learning policies upon conversion to spiking neuronal network platforms applied to Atari Breakout game. Neural Netw. 120, 108\u2013115 (2019)","journal-title":"Neural Netw."},{"key":"34_CR22","doi-asserted-by":"crossref","unstructured":"Tan, W., Patel, D., Kozma, R.: Strategy and benchmark for converting deep Q-networks to event-driven spiking neural networks. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp. 9816\u20139824 (2021)","DOI":"10.1609\/aaai.v35i11.17180"},{"key":"34_CR23","doi-asserted-by":"crossref","unstructured":"Diehl, P.U., Neil, D., Binas, J., Cook, M., Liu, S.C., Pfeiffer, M.: Fast-classifying, high-accuracy spiking deep networks through weight and threshold balancing. In: 2015 International Joint Conference on Neural Networks (IJCNN), pp. 1\u20138. IEEE (2015)","DOI":"10.1109\/IJCNN.2015.7280696"},{"key":"34_CR24","doi-asserted-by":"crossref","unstructured":"Rueckauer, B., Lungu, I.A., Hu, Y., Pfeiffer, M., Liu, S.C.: Conversion of continuous-valued deep networks to efficient event-driven networks for image classification. Front. Neurosci. 11 (2017)","DOI":"10.3389\/fnins.2017.00682"},{"key":"34_CR25","unstructured":"Deng, S., Gu, S.: Optimal conversion of conventional artificial neural networks to spiking neural networks. arXiv (2021)"},{"key":"34_CR26","unstructured":"Li, Y., Deng, S., Dong, X., Gong, R., Gu, S.: A free lunch from ANN: towards efficient, accurate spiking neural networks calibration. In: International Conference on Machine Learning, pp. 6316\u20136325. 
PMLR (2021)"},{"key":"34_CR27","unstructured":"Bu, T., Fang, W., Ding, J., et al.: Optimal ANN-SNN conversion for high-accuracy and ultra-low-latency spiking neural networks. arXiv (2023)"},{"key":"34_CR28","unstructured":"Fu, J., Kumar, A., Nachum, O., Tucker, G., Levine, S.: D4RL: datasets for deep data-driven reinforcement learning. arXiv (2020)"},{"key":"34_CR29","doi-asserted-by":"crossref","unstructured":"Qin, L., Yan, R., Tang, H.: A low latency adaptive coding spike framework for deep reinforcement learning. In: Proceedings of the Thirty-Second International Joint Conference on Artificial Intelligence, pp. 3049\u20133057 (2023)","DOI":"10.24963\/ijcai.2023\/340"}],"container-title":["Lecture Notes in Computer Science","Advanced Intelligent Computing Technology and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-97-5581-3_34","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,1]],"date-time":"2024-08-01T19:18:51Z","timestamp":1722539931000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-97-5581-3_34"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9789819755806","9789819755813"],"references-count":29,"URL":"https:\/\/doi.org\/10.1007\/978-981-97-5581-3_34","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"1 August 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors declare that they have no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICIC","order":1,"name":"conference_acronym","label":"Conference 
Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tianjin","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"5 August 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 August 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icic2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ic-icc.cn\/2024\/index.htm","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}