{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,7]],"date-time":"2026-02-07T08:56:36Z","timestamp":1770454596834,"version":"3.49.0"},"reference-count":43,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,7]]},"DOI":"10.1109\/infocom41043.2020.9155267","type":"proceedings-article","created":{"date-parts":[[2020,8,4]],"date-time":"2020-08-04T22:29:35Z","timestamp":1596580175000},"page":"1668-1677","source":"Crossref","is-referenced-by-count":43,"title":["Automating Cloud Deployment for Deep Learning Inference of Real-time Online Services"],"prefix":"10.1109","author":[{"given":"Yang","family":"Li","sequence":"first","affiliation":[]},{"given":"Zhenhua","family":"Han","sequence":"additional","affiliation":[]},{"given":"Quanlu","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Zhenhua","family":"Li","sequence":"additional","affiliation":[]},{"given":"Haisheng","family":"Tan","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"crossref","first-page":"671","DOI":"10.1126\/science.220.4598.671","article-title":"Optimization by Simulated Annealing","volume":"220","author":"kirkpatrick","year":"1983","journal-title":"Science"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1970.tb01770.x"},{"key":"ref33","article-title":"Low-Level Augmented Bayesian Optimization for Finding the Best Cloud VM","author":"hsu","year":"2017","journal-title":"arXiv preprint arXiv 1712 10081"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.25080\/Majora-8b375195-003"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/SERVICES.2013.55"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TST.2017.7830891"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3317689"},{"key":"ref36","article-title":"Accelerating CNN Inference on FPGAs: A Survey","author":"abdelouahab","year":"2018","journal-title":"arXiv preprint arXiv 1806 01683"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3190508.3190541"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1080\/00949655.2014.1002101"},{"key":"ref10","article-title":"Google&#x2019;s Neural Machine Translation System: Bridging the Gap between Human and Machine Translation","author":"wu","year":"2016","journal-title":"arXiv preprint arXiv 1609 04802"},{"key":"ref40","first-page":"175","article-title":"A Linear-time Heuristic for Improving Network Partitions","author":"fiduccia","year":"1982"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2017.83"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2008.07.035"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3135974.3135993"},{"key":"ref14","first-page":"4","article-title":"CherryPick: Adaptively Unearthing the Best Cloud Configurations for Big Data Analytics","volume":"2","author":"alipourfard","year":"2017","journal-title":"Proc of USENIX NSDI"},{"key":"ref15","article-title":"Device Placement Optimization with Reinforcement Learning","author":"mirhoseini","year":"2017","journal-title":"arXiv preprint arXiv 1706 04972"},{"key":"ref16","first-page":"1662","article-title":"Spotlight: Optimizing Device Placement for Training Deep Neural Networks","author":"gao","year":"2018","journal-title":"Proc of ICML"},{"key":"ref17","first-page":"265","article-title":"Tensorflow: A System for Large-scale Machine Learning","volume":"16","author":"abadi","year":"2016","journal-title":"Proc of USENIX OSDI"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"},{"key":"ref28","article-title":"Adam: A Method for Stochastic Optimization","author":"kingma","year":"2014","journal-title":"arXiv preprint arXiv 1412 6980"},{"key":"ref4","first-page":"1764","article-title":"Towards End-to-end Speech Recognition with Recurrent Neural Networks","author":"graves","year":"2014","journal-title":"Proc of ICML"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1023\/A:1008306431147"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472621"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1007\/BF00992696","article-title":"Simple Statistical Gradient-following Algorithms for Connectionist Reinforcement Learning","volume":"8","author":"williams","year":"1992","journal-title":"Machine Learning"},{"key":"ref5","article-title":"Deep Speech: Scaling up End-to-end Speech Recognition","author":"hannun","year":"2014","journal-title":"arXiv preprint arXiv 1412 5567"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"key":"ref7","first-page":"3104","article-title":"Sequence to Sequence Learning with Neural Networks","author":"sutskever","year":"2014","journal-title":"Proc of NIPS"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref9","article-title":"Neural Machine Translation by Jointly Learning to Align and Translate","author":"bahdanau","year":"2014","journal-title":"arXiv preprint arXiv 1409 0473"},{"key":"ref1","first-page":"1097","article-title":"Imagenet Classification with Deep Convolutional Neural Networks","author":"krizhevsky","year":"2012","journal-title":"Proc of NIPS"},{"key":"ref20","first-page":"595","article-title":"Gandiva: Introspective Cluster Scheduling for Deep Learning","author":"xiao","year":"2018","journal-title":"Proc of USENIX OSDI"},{"key":"ref22","article-title":"Distillating Knowledge about Scotch","author":"pellegrini","year":"2009","journal-title":"Dagstuhl Seminar Proceedings"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3132747.3132766"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/43.159993"},{"key":"ref24","article-title":"Neural combinatorial optimization with reinforcement learning","author":"bello","year":"2016","journal-title":"arXiv preprint arXiv 1611 09940"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1287\/opre.37.6.865"},{"key":"ref23","article-title":"METIS-Unstructured Graph Partitioning and Sparse Matrix Ordering System, Version 2.0","author":"karypis","year":"1995"},{"key":"ref26","first-page":"2951","article-title":"Practical Bayesian Optimization of Machine Learning Algorithms","author":"snoek","year":"2012","journal-title":"Proc of NIPS"},{"key":"ref43","article-title":"Placeto: Efficient Progressive Device Placement Optimization","author":"addanki","year":"2018","journal-title":"Proc NIPS Workshop Mach Learn Syst"},{"key":"ref25","first-page":"525","article-title":"BOA: The Bayesian Optimization Algorithm","author":"pelikan","year":"1999","journal-title":"Proc of GECCO"}],"event":{"name":"IEEE INFOCOM 2020 - IEEE Conference on Computer Communications","location":"Toronto, ON, Canada","start":{"date-parts":[[2020,7,6]]},"end":{"date-parts":[[2020,7,9]]}},"container-title":["IEEE INFOCOM 2020 - IEEE Conference on Computer Communications"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9146503\/9155217\/09155267.pdf?arnumber=9155267","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,28]],"date-time":"2022-06-28T21:50:59Z","timestamp":1656453059000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9155267\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7]]},"references-count":43,"URL":"https:\/\/doi.org\/10.1109\/infocom41043.2020.9155267","relation":{},"subject":[],"published":{"date-parts":[[2020,7]]}}}