{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,27]],"date-time":"2026-04-27T10:48:09Z","timestamp":1777286889863,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":80,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T00:00:00Z","timestamp":1596067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100000185","name":"Defense Advanced Research Projects Agency","doi-asserted-by":"publisher","award":["BRASS"],"award-info":[{"award-number":["BRASS"]}],"id":[{"id":"10.13039\/100000185","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-1901466, CCF-1439156,CNS-1526304, CCF-1823032, CNS-1764039"],"award-info":[{"award-number":["CNS-1901466, CCF-1439156,CNS-1526304, CCF-1823032, CNS-1764039"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000015","name":"U.S. Department of Energy","doi-asserted-by":"publisher","award":["DESC0014195 0003"],"award-info":[{"award-number":["DESC0014195 0003"]}],"id":[{"id":"10.13039\/100000015","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000183","name":"Army Research Office","doi-asserted-by":"publisher","award":["W911NF1920321"],"award-info":[{"award-number":["W911NF1920321"]}],"id":[{"id":"10.13039\/100000183","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100006785","name":"Google","doi-asserted-by":"publisher","award":["Faculty Research Award"],"award-info":[{"award-number":["Faculty Research Award"]}],"id":[{"id":"10.13039\/100006785","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,7,30]]},"DOI":"10.1145\/3387514.3405887","type":"proceedings-article","created":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T22:35:31Z","timestamp":1596148531000},"page":"557-570","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":200,"title":["Server-Driven Video Streaming for Deep Learning Inference"],"prefix":"10.1145","author":[{"given":"Kuntai","family":"Du","sequence":"first","affiliation":[{"name":"University of Chicago"}]},{"given":"Ahsan","family":"Pervaiz","sequence":"additional","affiliation":[{"name":"University of Chicago"}]},{"given":"Xin","family":"Yuan","sequence":"additional","affiliation":[{"name":"University of Chicago"}]},{"given":"Aakanksha","family":"Chowdhery","sequence":"additional","affiliation":[{"name":"University of Chicago"}]},{"given":"Qizheng","family":"Zhang","sequence":"additional","affiliation":[{"name":"University of Chicago"}]},{"given":"Henry","family":"Hoffmann","sequence":"additional","affiliation":[{"name":"University of Chicago"}]},{"given":"Junchen","family":"Jiang","sequence":"additional","affiliation":[{"name":"University of Chicago"}]}],"member":"320","published-online":{"date-parts":[[2020,7,30]]},"reference":[{"key":"e_1_3_2_2_1_1","unstructured":"4g\/lte bandwidth logs. http:\/\/users.ugent.be\/~jvdrhoof\/dataset-4g\/.  4g\/lte bandwidth logs. http:\/\/users.ugent.be\/~jvdrhoof\/dataset-4g\/."},{"key":"e_1_3_2_2_2_1","unstructured":"Are we ready for ai-powered security cameras? https:\/\/thenewstack.io\/are-we-ready-for-ai-powered-security-cameras\/.  Are we ready for ai-powered security cameras? https:\/\/thenewstack.io\/are-we-ready-for-ai-powered-security-cameras\/."},{"key":"e_1_3_2_2_3_1","unstructured":"At&t unlimited data plans with talk & text. https:\/\/www.att.com\/plans\/unlimited-data-plans\/. (Accessed on 06\/15\/2020).  At&t unlimited data plans with talk & text. https:\/\/www.att.com\/plans\/unlimited-data-plans\/. (Accessed on 06\/15\/2020)."},{"key":"e_1_3_2_2_4_1","unstructured":"Benchmarking videos used in dds. https:\/\/github.com\/KuntaiDu\/dds.  Benchmarking videos used in dds. https:\/\/github.com\/KuntaiDu\/dds."},{"key":"e_1_3_2_2_5_1","unstructured":"Can 30 000 cameras help solve chicago's crime problem? https:\/\/www.nytimes.com\/2018\/05\/26\/us\/chicago-police-surveillance.html.  Can 30 000 cameras help solve chicago's crime problem? https:\/\/www.nytimes.com\/2018\/05\/26\/us\/chicago-police-surveillance.html."},{"key":"e_1_3_2_2_6_1","unstructured":"Cloud-based video analytics as a service of 2018. https:\/\/www.asmag.com\/showpost\/27143.aspx.  Cloud-based video analytics as a service of 2018. https:\/\/www.asmag.com\/showpost\/27143.aspx."},{"key":"e_1_3_2_2_7_1","unstructured":"Dashjs. https:\/\/github.com\/Dash-Industry-Forum\/dash.js.  Dashjs. https:\/\/github.com\/Dash-Industry-Forum\/dash.js."},{"key":"e_1_3_2_2_8_1","unstructured":"Dds: Machine-centric video streaming. https:\/\/github.com\/KuntaiDu\/dds.  Dds: Machine-centric video streaming. https:\/\/github.com\/KuntaiDu\/dds."},{"key":"e_1_3_2_2_9_1","unstructured":"Faster r-cnn on jetson tx2. https:\/\/jkjung-avt.github.io\/faster-rcnn\/. Accessed: 7\/3\/2020.  Faster r-cnn on jetson tx2. https:\/\/jkjung-avt.github.io\/faster-rcnn\/. Accessed: 7\/3\/2020."},{"key":"e_1_3_2_2_10_1","unstructured":"Fastest wireless network in 2020: We tested 8 carriers to crown a winner | tom's guide. https:\/\/www.tomsguide.com\/us\/best-mobile-network.review-2942.html. (Accessed on 06\/15\/2020).  Fastest wireless network in 2020: We tested 8 carriers to crown a winner | tom's guide. https:\/\/www.tomsguide.com\/us\/best-mobile-network.review-2942.html. (Accessed on 06\/15\/2020)."},{"key":"e_1_3_2_2_11_1","unstructured":"Gpus pricing | compute engine documentation | google cloud. https:\/\/cloud.google.com\/compute\/gpus-pricing. (Accessed on 06\/21\/2020).  Gpus pricing | compute engine documentation | google cloud. https:\/\/cloud.google.com\/compute\/gpus-pricing. (Accessed on 06\/21\/2020)."},{"key":"e_1_3_2_2_12_1","unstructured":"How ai based video analytics is benefiting retail industry. https:\/\/www.lanner-america.com\/blog\/ai-based-video-analytics-benefiting-retail-industry\/.  How ai based video analytics is benefiting retail industry. https:\/\/www.lanner-america.com\/blog\/ai-based-video-analytics-benefiting-retail-industry\/."},{"key":"e_1_3_2_2_13_1","unstructured":"Hp r0w29a tesla t4 graphic card - 1 gpus - 16 gb. https:\/\/www.amazon.com\/HP-R0W29A-Tesla-Graphic-Card\/dp\/B07PGY6QPT\/. Accessed: 2020-1-29.  Hp r0w29a tesla t4 graphic card - 1 gpus - 16 gb. https:\/\/www.amazon.com\/HP-R0W29A-Tesla-Graphic-Card\/dp\/B07PGY6QPT\/. Accessed: 2020-1-29."},{"key":"e_1_3_2_2_14_1","unstructured":"Insightface: 2d and 3d face analysis project. https:\/\/github.com\/deepinsight\/insightface.  Insightface: 2d and 3d face analysis project. https:\/\/github.com\/deepinsight\/insightface."},{"key":"e_1_3_2_2_15_1","unstructured":"Jetson tx2. https:\/\/www.nvidia.com\/en-us\/autonomous-machines\/embedded-systems\/jetson-tx2\/. Accessed: 7\/3\/2020.  Jetson tx2. https:\/\/www.nvidia.com\/en-us\/autonomous-machines\/embedded-systems\/jetson-tx2\/. Accessed: 7\/3\/2020."},{"key":"e_1_3_2_2_16_1","unstructured":"Nvidia deep learning inference technical overview table \"jetson tx2 (maxq mode)\" at row resnet50 batch size 128. http:\/\/www.nextplatform.com\/wp-content\/uploads\/2018\/01\/inference-technical-overview-1.pdf. Accessed: 7\/3\/2020.  Nvidia deep learning inference technical overview table \"jetson tx2 (maxq mode)\" at row resnet50 batch size 128. http:\/\/www.nextplatform.com\/wp-content\/uploads\/2018\/01\/inference-technical-overview-1.pdf. Accessed: 7\/3\/2020."},{"key":"e_1_3_2_2_17_1","unstructured":"Nvidia tesla deep learning product performance (table \"t4 inference performance\" at row resnet50 batch size 128). https:\/\/developer.nvidia.com\/deep-learning-performance-training-inference. Accessed: 7\/3\/2020.  Nvidia tesla deep learning product performance (table \"t4 inference performance\" at row resnet50 batch size 128). https:\/\/developer.nvidia.com\/deep-learning-performance-training-inference. Accessed: 7\/3\/2020."},{"key":"e_1_3_2_2_18_1","unstructured":"Official implementation of efficient cascading residual network for sr. https:\/\/github.com\/nmhkahn\/CARN-pytorch.  Official implementation of efficient cascading residual network for sr. https:\/\/github.com\/nmhkahn\/CARN-pytorch."},{"key":"e_1_3_2_2_19_1","unstructured":"Smraza raspberry pi 4 camera module 5 megapixels 1080p. https:\/\/www.amazon.com\/Smraza-Raspberry-Megapixels-Adjustable-Fish-Eye\/dp\/B07L2SY756\/. Accessed: 2020-1-29.  Smraza raspberry pi 4 camera module 5 megapixels 1080p. https:\/\/www.amazon.com\/Smraza-Raspberry-Megapixels-Adjustable-Fish-Eye\/dp\/B07L2SY756\/. Accessed: 2020-1-29."},{"key":"e_1_3_2_2_20_1","unstructured":"Tensorflow detection model zoo. https:\/\/github.com\/tensorflow\/models\/blob\/master\/research\/object_detection\/g3doc\/detection_model_zoo.md.  Tensorflow detection model zoo. https:\/\/github.com\/tensorflow\/models\/blob\/master\/research\/object_detection\/g3doc\/detection_model_zoo.md."},{"key":"e_1_3_2_2_21_1","unstructured":"Video meets the internet of things. https:\/\/www.mckinsey.com\/industries\/high-tech\/our-insights\/video-meets-the-internet-of-things.  Video meets the internet of things. https:\/\/www.mckinsey.com\/industries\/high-tech\/our-insights\/video-meets-the-internet-of-things."},{"key":"e_1_3_2_2_22_1","unstructured":"Videosurveillance:Howtechnologyandthecloudisdisruptingthemarket.https:\/\/cdn.ihs.com\/www\/pdf\/IHS-Markit-Technology-Video-surveillance.pdf.  Videosurveillance:Howtechnologyandthecloudisdisruptingthemarket.https:\/\/cdn.ihs.com\/www\/pdf\/IHS-Markit-Technology-Video-surveillance.pdf."},{"key":"e_1_3_2_2_23_1","unstructured":"Vision meets drones: A challenge. http:\/\/www.aiskyeye.com\/.  Vision meets drones: A challenge. http:\/\/www.aiskyeye.com\/."},{"key":"e_1_3_2_2_24_1","unstructured":"Wi-fi vs. cellular: Which is better for iot? https:\/\/www.verypossible.com\/blog\/wi-fi-vs-cellular-which-is-better-for-iot.  Wi-fi vs. cellular: Which is better for iot? https:\/\/www.verypossible.com\/blog\/wi-fi-vs-cellular-which-is-better-for-iot."},{"key":"e_1_3_2_2_25_1","unstructured":"x264 open source video lan. https:\/\/www.videolan.org\/developers\/x264.html.  x264 open source video lan. https:\/\/www.videolan.org\/developers\/x264.html."},{"key":"e_1_3_2_2_26_1","first-page":"252","volume-title":"Proceedings of the European Conference on Computer Vision (ECCV)","author":"Ahn Namhyuk","year":"2018","unstructured":"Namhyuk Ahn , Byungkon Kang , and Kyung-Ah Sohn . Fast, accurate , and light-weight super-resolution with cascading residual network . In Proceedings of the European Conference on Computer Vision (ECCV) , pages 252 -- 268 , 2018 . Namhyuk Ahn, Byungkon Kang, and Kyung-Ah Sohn. Fast, accurate, and light-weight super-resolution with cascading residual network. In Proceedings of the European Conference on Computer Vision (ECCV), pages 252--268, 2018."},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2017.3641638"},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/MS.2018.2884864"},{"key":"e_1_3_2_2_29_1","volume-title":"End-to-end object detection with transformers. arXiv preprint arXiv.2005.12872","author":"Carion Nicolas","year":"2020","unstructured":"Nicolas Carion , Francisco Massa , Gabriel Synnaeve , Nicolas Usunier , Alexander Kirillov , and Sergey Zagoruyko . End-to-end object detection with transformers. arXiv preprint arXiv.2005.12872 , 2020 . Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-end object detection with transformers. arXiv preprint arXiv.2005.12872, 2020."},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/2809695.2809711"},{"key":"e_1_3_2_2_31_1","volume-title":"Adascale: Towards realtime video object detection using adaptive scaling. arXiv preprint arXiv:1902.02910","author":"Chin Ting-Wu","year":"2019","unstructured":"Ting-Wu Chin , Ruizhou Ding , and Diana Marculescu . Adascale: Towards realtime video object detection using adaptive scaling. arXiv preprint arXiv:1902.02910 , 2019 . Ting-Wu Chin, Ruizhou Ding, and Diana Marculescu. Adascale: Towards realtime video object detection using adaptive scaling. arXiv preprint arXiv:1902.02910, 2019."},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/3286062.3286070"},{"key":"e_1_3_2_2_33_1","volume-title":"265 and iso","author":"Video Coding High Efficiency","year":"2013","unstructured":"High Efficiency Video Coding and ITUT Rec . H. 265 and iso , 2013 . High Efficiency Video Coding and ITUT Rec. H. 265 and iso, 2013."},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00482"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/2018436.2018478"},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/3349614.3356023"},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/2568225.2568272"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/3301293.3302365"},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"e_1_3_2_2_40_1","volume-title":"High-speed tracking with kernelized correlation filters","author":"Henriques Jo\u00e3o F","year":"2014","unstructured":"Jo\u00e3o F Henriques , Rui Caseiro , Pedro Martins , and Jorge Batista . High-speed tracking with kernelized correlation filters . IEEE transactions on pattern analysis and machine intelligence, 37(3):583--596, 2014 . Jo\u00e3o F Henriques, Rui Caseiro, Pedro Martins, and Jorge Batista. High-speed tracking with kernelized correlation filters. IEEE transactions on pattern analysis and machine intelligence, 37(3):583--596, 2014."},{"key":"e_1_3_2_2_41_1","volume-title":"Dec","author":"Hetang Congrui","year":"2017","unstructured":"Congrui Hetang , Hongwei Qin , Shaohui Liu , and Junjie Yan . Impression network for video object detection. https:\/\/arxiv.org\/pdf\/1712.05896.pdf , Dec 2017 . Congrui Hetang, Hongwei Qin, Shaohui Liu, and Junjie Yan. Impression network for video object detection. https:\/\/arxiv.org\/pdf\/1712.05896.pdf, Dec 2017."},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/SEC.2018.00016"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3301293.3302366"},{"key":"e_1_3_2_2_44_1","first-page":"29","volume-title":"2018 USENIX Annual Technical Conference (USENIX ATC 18)","author":"Jiang Angela H","year":"2018","unstructured":"Angela H Jiang , Daniel L-K Wong , Christopher Canel , Lilia Tang , Ishan Misra , Michael Kaminsky , Michael A Kozuch , Padmanabhan Pillai , David G Andersen , and Gregory R Ganger . Mainstream : Dynamic stem-sharing for multi-tenant video processing . In 2018 USENIX Annual Technical Conference (USENIX ATC 18) , pages 29 -- 42 , 2018 . Angela H Jiang, Daniel L-K Wong, Christopher Canel, Lilia Tang, Ishan Misra, Michael Kaminsky, Michael A Kozuch, Padmanabhan Pillai, David G Andersen, and Gregory R Ganger. Mainstream: Dynamic stem-sharing for multi-tenant video processing. In 2018 USENIX Annual Technical Conference (USENIX ATC 18), pages 29--42, 2018."},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/3230543.3230574"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2013.2291681"},{"issue":"3","key":"e_1_3_2_2_47_1","first-page":"44","article-title":"A survey on moving object detection and tracking in video surveillance system","volume":"2","author":"Joshi Kinjal A","year":"2012","unstructured":"Kinjal A Joshi and Darshak G Thakore . A survey on moving object detection and tracking in video surveillance system . International Journal of Soft Computing and Engineering , 2 ( 3 ): 44 -- 48 , 2012 . Kinjal A Joshi and Darshak G Thakore. A survey on moving object detection and tracking in video surveillance system. International Journal of Soft Computing and Engineering, 2(3):44--48, 2012.","journal-title":"International Journal of Soft Computing and Engineering"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.14778\/3137628.3137664"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/CPSNA.2015.23"},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2013.2281542"},{"key":"e_1_3_2_2_51_1","volume-title":"Deeplens: Towards a visual data management system. arXiv preprint arXiv","author":"Krishnan Sanjay","year":"1812","unstructured":"Sanjay Krishnan , Adam Dziedzic , and Aaron J Elmore . Deeplens: Towards a visual data management system. arXiv preprint arXiv 1812 .07607, 2018. Sanjay Krishnan, Adam Dziedzic, and Aaron J Elmore. Deeplens: Towards a visual data management system. arXiv preprint arXiv 1812.07607, 2018."},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"publisher","DOI":"10.1145\/2742647.2742663"},{"key":"e_1_3_2_2_53_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00718"},{"key":"e_1_3_2_2_54_1","doi-asserted-by":"publisher","DOI":"10.1145\/3300061.3300116"},{"key":"e_1_3_2_2_55_1","volume-title":"Mar","author":"Liu Mason","year":"2018","unstructured":"Mason Liu and Menglong Zhu . Mobile video object detection with temporally-aware feature maps. https:\/\/arxiv.org\/pdf\/1711.06368.pdf , Mar 2018 . Mason Liu and Menglong Zhu. Mobile video object detection with temporally-aware feature maps. https:\/\/arxiv.org\/pdf\/1711.06368.pdf, Mar 2018."},{"key":"e_1_3_2_2_56_1","first-page":"6738","volume-title":"CVPR","author":"Liu Weiyang","year":"2017","unstructured":"Weiyang Liu , Yandong Wen , Zhiding Yu , Ming Li , Bhiksha Raj , and Le Song . Sphereface : Deep hypersphere embedding for face recognition . In CVPR , pages 6738 -- 6746 , 2017 . Weiyang Liu, Yandong Wen, Zhiding Yu, Ming Li, Bhiksha Raj, and Le Song. Sphereface: Deep hypersphere embedding for face recognition. In CVPR, pages 6738--6746, 2017."},{"key":"e_1_3_2_2_57_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"e_1_3_2_2_58_1","doi-asserted-by":"publisher","DOI":"10.1145\/2987550.2987564"},{"key":"e_1_3_2_2_60_1","volume-title":"ASPLOS","author":"Mishra Nikita","year":"2018","unstructured":"Nikita Mishra , Connor Imes , John D. Lafferty , and Henry Hoffmann . CALOREE : learning control for predictable latency and low energy . In ASPLOS , 2018 . Nikita Mishra, Connor Imes, John D. Lafferty, and Henry Hoffmann. CALOREE: learning control for predictable latency and low energy. In ASPLOS, 2018."},{"key":"e_1_3_2_2_61_1","first-page":"2204","volume-title":"Advances in neural information processing systems","author":"Mnih Volodymyr","year":"2014","unstructured":"Volodymyr Mnih , Nicolas Heess , Alex Graves , Recurrent models of visual attention . In Advances in neural information processing systems , pages 2204 -- 2212 , 2014 . Volodymyr Mnih, Nicolas Heess, Alex Graves, et al. Recurrent models of visual attention. In Advances in neural information processing systems, pages 2204--2212, 2014."},{"key":"e_1_3_2_2_62_1","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2004.839611"},{"key":"e_1_3_2_2_63_1","volume-title":"10th USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 18)","author":"Pakha Chrisma","year":"2018","unstructured":"Chrisma Pakha , Aakanksha Chowdhery , and Junchen Jiang . Reinventing video streaming for distributed vision analytics . In 10th USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 18) , Boston, MA , July 2018 . USENIX Association. Chrisma Pakha, Aakanksha Chowdhery, and Junchen Jiang. Reinventing video streaming for distributed vision analytics. In 10th USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 18), Boston, MA, July 2018. USENIX Association."},{"key":"e_1_3_2_2_64_1","volume-title":"Scanner: Efficient video analysis at scale. ACM Transactions on Graphics (TOG), 37(4):1--13","author":"Poms Alex","year":"2018","unstructured":"Alex Poms , Will Crichton , Pat Hanrahan , and Kayvon Fatahalian . Scanner: Efficient video analysis at scale. ACM Transactions on Graphics (TOG), 37(4):1--13 , 2018 . Alex Poms, Will Crichton, Pat Hanrahan, and Kayvon Fatahalian. Scanner: Efficient video analysis at scale. ACM Transactions on Graphics (TOG), 37(4):1--13, 2018."},{"key":"e_1_3_2_2_65_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"e_1_3_2_2_66_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.690"},{"key":"e_1_3_2_2_67_1","first-page":"91","volume-title":"Advances in neural information processing systems","author":"Ren Shaoqing","year":"2015","unstructured":"Shaoqing Ren , Kaiming He , Ross Girshick , and Jian Sun . Faster r-cnn: Towards real-time object detection with region proposal networks . In Advances in neural information processing systems , pages 91 -- 99 , 2015 . Shaoqing Ren, Kaiming He, Ross Girshick, and Jian Sun. Faster r-cnn: Towards real-time object detection with region proposal networks. In Advances in neural information processing systems, pages 91--99, 2015."},{"key":"e_1_3_2_2_68_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"e_1_3_2_2_69_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"e_1_3_2_2_70_1","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2014.2360940"},{"key":"e_1_3_2_2_71_1","volume-title":"Fast video classification via adaptive cascading of deep models. arXiv preprint","author":"Shen Haichen","year":"2017","unstructured":"Haichen Shen , Seungyeop Han , Matthai Philipose , and Arvind Krishnamurthy . Fast video classification via adaptive cascading of deep models. arXiv preprint , 2017 . Haichen Shen, Seungyeop Han, Matthai Philipose, and Arvind Krishnamurthy. Fast video classification via adaptive cascading of deep models. arXiv preprint, 2017."},{"key":"e_1_3_2_2_72_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2017.226"},{"key":"e_1_3_2_2_73_1","doi-asserted-by":"publisher","DOI":"10.1109\/NAFIPS.2012.6291011"},{"key":"e_1_3_2_2_74_1","first-page":"5998","volume-title":"Advances in neural information processing systems","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani , Noam Shazeer , Niki Parmar , Jakob Uszkoreit , Llion Jones , Aidan N Gomez , \u0141ukasz Kaiser , and Illia Polosukhin . Attention is all you need . In Advances in neural information processing systems , pages 5998 -- 6008 , 2017 . Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In Advances in neural information processing systems, pages 5998--6008, 2017."},{"key":"e_1_3_2_2_75_1","volume-title":"Proceedings of the 22nd International Conference on Extending Database Technology (EDBT)","author":"Wang Han","year":"2020","unstructured":"Han Wang , Yuan Hong , Yu Kong , and Jaideep Vaidya . Publishing video data with indistinguishable objects . In Proceedings of the 22nd International Conference on Extending Database Technology (EDBT) , 2020 . Han Wang, Yuan Hong, Yu Kong, and Jaideep Vaidya. Publishing video data with indistinguishable objects. In Proceedings of the 22nd International Conference on Extending Database Technology (EDBT), 2020."},{"key":"e_1_3_2_2_76_1","volume-title":"11th USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 19)","author":"Wang Yiding","year":"2019","unstructured":"Yiding Wang , Weiyan Wang , Junxue Zhang , Junchen Jiang , and Kai Chen . Bridging the edge-cloud barrier for real-time advanced vision analytics . In 11th USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 19) , 2019 . Yiding Wang, Weiyan Wang, Junxue Zhang, Junchen Jiang, and Kai Chen. Bridging the edge-cloud barrier for real-time advanced vision analytics. In 11th USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 19), 2019."},{"key":"e_1_3_2_2_77_1","volume-title":"Object tracking: A survey. Acm computing surveys (CSUR), 38(4):13","author":"Yilmaz Alper","year":"2006","unstructured":"Alper Yilmaz , Omar Javed , and Mubarak Shah . Object tracking: A survey. Acm computing surveys (CSUR), 38(4):13 , 2006 . Alper Yilmaz, Omar Javed, and Mubarak Shah. Object tracking: A survey. Acm computing surveys (CSUR), 38(4):13, 2006."},{"key":"e_1_3_2_2_78_1","doi-asserted-by":"publisher","DOI":"10.1145\/3230543.3230554"},{"key":"e_1_3_2_2_79_1","first-page":"1","volume-title":"NSDI","volume":"9","author":"Zhang Haoyu","year":"2017","unstructured":"Haoyu Zhang , Ganesh Ananthanarayanan , Peter Bodik , Matthai Philipose , Paramvir Bahl , and Michael J Freedman . Live video analytics at scale with approximation and delay-tolerance . In NSDI , volume 9 , page 1 , 2017 . Haoyu Zhang, Ganesh Ananthanarayanan, Peter Bodik, Matthai Philipose, Paramvir Bahl, and Michael J Freedman. Live video analytics at scale with approximation and delay-tolerance. In NSDI, volume 9, page 1, 2017."},{"key":"e_1_3_2_2_80_1","doi-asserted-by":"publisher","DOI":"10.1145\/2789168.2790123"},{"key":"e_1_3_2_2_81_1","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM.2017.8057057"}],"event":{"name":"SIGCOMM '20: Annual conference of the ACM Special Interest Group on Data Communication on the applications, technologies, architectures, and protocols for computer communication","location":"Virtual Event USA","acronym":"SIGCOMM '20","sponsor":["SIGCOMM ACM Special Interest Group on Data Communication"]},"container-title":["Proceedings of the Annual conference of the ACM Special Interest Group on Data Communication on the applications, technologies, architectures, and protocols for computer communication"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3387514.3405887","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3387514.3405887","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3387514.3405887","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T22:41:36Z","timestamp":1750200096000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3387514.3405887"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7,30]]},"references-count":80,"alternative-id":["10.1145\/3387514.3405887","10.1145\/3387514"],"URL":"https:\/\/doi.org\/10.1145\/3387514.3405887","relation":{},"subject":[],"published":{"date-parts":[[2020,7,30]]},"assertion":[{"value":"2020-07-30","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}