{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:09:29Z","timestamp":1750219769398,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":66,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,4,30]],"date-time":"2023-04-30T00:00:00Z","timestamp":1682812800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100001691","name":"Japan Society for the Promotion of Science","doi-asserted-by":"publisher","award":["21J22490"],"award-info":[{"award-number":["21J22490"]}],"id":[{"id":"10.13039\/501100001691","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,4,30]]},"DOI":"10.1145\/3543507.3583346","type":"proceedings-article","created":{"date-parts":[[2023,4,26]],"date-time":"2023-04-26T23:30:51Z","timestamp":1682551851000},"page":"1616-1625","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Active Learning from the Web"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6912-4464","authenticated-orcid":false,"given":"Ryoma","family":"Sato","sequence":"first","affiliation":[{"name":"Kyoto University, Japan and RIKEN AIP, Japan"}]}],"member":"320","published-online":{"date-parts":[[2023,4,30]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"14th Asian Conference on Computer Vision, ACCV, Vol.\u00a011363","author":"Akcay Samet","year":"2018","unstructured":"Samet Akcay, Amir\u00a0Atapour Abarghouei, and Toby\u00a0P. Breckon. 2018. GANomaly: Semi-supervised Anomaly Detection via Adversarial Training. In 14th Asian Conference on Computer Vision, ACCV, Vol.\u00a011363. Springer, 622\u2013637."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF00116828"},{"key":"e_1_3_2_1_3_1","volume-title":"Uncertain Gradient Lower Bounds. In 8th International Conference on Learning Representations, ICLR.","author":"Ash T.","year":"2020","unstructured":"Jordan\u00a0T. Ash, Chicheng Zhang, Akshay Krishnamurthy, John Langford, and Alekh Agarwal. 2020. Deep Batch Active Learning by Diverse, Uncertain Gradient Lower Bounds. In 8th International Conference on Learning Representations, ICLR."},{"key":"e_1_3_2_1_4_1","unstructured":"Les\u00a0E. Atlas David\u00a0A. Cohn and Richard\u00a0E. Ladner. 1989. Training Connectionist Networks with Queries and Selective Sampling. In NeurIPS. 566\u2013573."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/2020408.2020443"},{"key":"e_1_3_2_1_6_1","unstructured":"Alexei Baevski Yuhao Zhou Abdelrahman Mohamed and Michael Auli. 2020. wav2vec 2.0: A Framework for Self-Supervised Learning of Speech Representations. In NeurIPS."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Ricardo\u00a0A. Baeza-Yates Carlos Castillo Mauricio Mar\u00edn and M.\u00a0Andrea Rodr\u00edguez. 2005. Crawling a country: better strategies than breadth-first for web page ordering. In WWW. 864\u2013872.","DOI":"10.1145\/1062745.1062768"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Luciano Barbosa and Juliana Freire. 2007. An adaptive crawler for locating hidden-web entry points. In WWW. 441\u2013450.","DOI":"10.1145\/1242572.1242632"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"William\u00a0H. Beluch Tim Genewein Andreas N\u00fcrnberger and Jan\u00a0M. K\u00f6hler. 2018. The Power of Ensembles for Active Learning in Image Classification. In CVPR. 9368\u20139377.","DOI":"10.1109\/CVPR.2018.00976"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1016\/0169-7552(94)90132-5"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.14778\/3476311.3476346"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1016\/S1389-1286(99)00052-3"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Hao Chen Qi Dou Xi Wang Jing Qin and Pheng-Ann Heng. 2016. Mitosis Detection in Breast Cancer Histology Images via Deep Cascaded Networks. In AAAI. 1160\u20131166.","DOI":"10.1609\/aaai.v30i1.10140"},{"key":"e_1_3_2_1_14_1","unstructured":"Ting Chen Simon Kornblith Mohammad Norouzi and Geoffrey\u00a0E. Hinton. 2020. A Simple Framework for Contrastive Learning of Visual Representations. In ICML Vol.\u00a0119. PMLR 1597\u20131607."},{"key":"e_1_3_2_1_15_1","unstructured":"Gui Citovsky Giulia DeSalvo Claudio Gentile Lazaros Karydas Anand Rajagopalan Afshin Rostamizadeh and Sanjiv Kumar. 2021. Batch Active Learning at Scale. In NeurIPS. 11933\u201311944."},{"key":"e_1_3_2_1_16_1","volume-title":"BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In Proceedings of the 2019 Conference of the North American","author":"Devlin Jacob","year":"2019","unstructured":"Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova. 2019. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT. Association for Computational Linguistics, 4171\u20134186."},{"key":"e_1_3_2_1_17_1","unstructured":"Prafulla Dhariwal and Alexander\u00a0Quinn Nichol. 2021. Diffusion Models Beat GANs on Image Synthesis. In NeurIPS. 8780\u20138794."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01421-6_11"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1063"},{"key":"e_1_3_2_1_20_1","unstructured":"Yarin Gal Riashat Islam and Zoubin Ghahramani. 2017. Deep Bayesian Active Learning with Image Data. In ICML Vol.\u00a070. PMLR 1183\u20131192."},{"key":"e_1_3_2_1_21_1","unstructured":"Robert Geirhos Kantharaju Narayanappa Benjamin Mitzkus Tizian Thieringer Matthias Bethge Felix\u00a0A. Wichmann and Wieland Brendel. 2021. Partial success in closing the gap between human and machine vision. In NeurIPS. 23885\u201323899."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"crossref","unstructured":"Ziyu Guan Can Wang Chun Chen Jiajun Bu and Junfeng Wang. 2008. Guide focused crawler efficiently and effectively using on-line topical importance estimation. In SIGIR. 757\u2013758.","DOI":"10.1145\/1390334.1390488"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2019\/343"},{"key":"e_1_3_2_1_24_1","unstructured":"Kaiming He Haoqi Fan Yuxin Wu Saining Xie and Ross\u00a0B. Girshick. 2020. Momentum Contrast for Unsupervised Visual Representation Learning. In CVPR. 9726\u20139735."},{"key":"e_1_3_2_1_25_1","unstructured":"Kaiming He Xiangyu Zhang Shaoqing Ren and Jian Sun. 2016. Deep Residual Learning for Image Recognition. In CVPR. 770\u2013778."},{"key":"e_1_3_2_1_26_1","volume-title":"Empirically. arXiv abs\/1712.00409","author":"Hestness Joel","year":"2017","unstructured":"Joel Hestness, Sharan Narang, Newsha Ardalani, Gregory\u00a0F. Diamos, Heewoo Jun, Hassan Kianinejad, Md. Mostofa\u00a0Ali Patwary, Yang Yang, and Yanqi Zhou. 2017. Deep Learning Scaling is Predictable, Empirically. arXiv abs\/1712.00409 (2017)."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"crossref","unstructured":"Steven C.\u00a0H. Hoi Rong Jin Jianke Zhu and Michael\u00a0R. Lyu. 2006. Batch mode active learning and its application to medical image classification. In ICML Vol.\u00a0148. 417\u2013424.","DOI":"10.1145\/1143844.1143897"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2008.4563068"},{"key":"e_1_3_2_1_29_1","unstructured":"Judy Johnson Kostas Tsioutsiouliklis and C.\u00a0Lee Giles. 2003. Evolving Strategies for Focused Web Crawling. In ICML. 298\u2013305."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"crossref","unstructured":"Ajay\u00a0J. Joshi Fatih Porikli and Nikolaos Papanikolopoulos. 2009. Multi-class active learning for image classification. In CVPR. 2372\u20132379.","DOI":"10.1109\/CVPR.2009.5206627"},{"key":"e_1_3_2_1_31_1","volume-title":"Scaling Laws for Neural Language Models. arXiv abs\/2001.08361","author":"Kaplan Jared","year":"2020","unstructured":"Jared Kaplan, Sam McCandlish, Tom Henighan, Tom\u00a0B. Brown, Benjamin Chess, Rewon Child, Scott Gray, Alec Radford, Jeffrey Wu, and Dario Amodei. 2020. Scaling Laws for Neural Language Models. arXiv abs\/2001.08361 (2020)."},{"key":"e_1_3_2_1_32_1","unstructured":"Andreas Kirsch Joost van Amersfoort and Yarin Gal. 2019. BatchBALD: Efficient and Diverse Batch Acquisition for Deep Bayesian Active Learning. In NeurIPS. 7024\u20137035."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-020-01316-z"},{"volume-title":"Proceedings of the 17th Annual International ACM-SIGIR Conference on Research and Development in Information Retrieval, SIGIR. ACM, 3\u201312","author":"D.","key":"e_1_3_2_1_34_1","unstructured":"David\u00a0D. Lewis and William\u00a0A. Gale. 1994. A Sequential Algorithm for Training Text Classifiers. In Proceedings of the 17th Annual International ACM-SIGIR Conference on Research and Development in Information Retrieval, SIGIR. ACM, 3\u201312."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"crossref","unstructured":"Lihong Li Wei Chu John Langford and Robert\u00a0E. Schapire. 2010. A contextual-bandit approach to personalized news article recommendation. In WWW. 661\u2013670.","DOI":"10.1145\/1772690.1772758"},{"key":"e_1_3_2_1_36_1","volume-title":"Learning Without Forgetting. In 14th European Conference","author":"Li Zhizhong","year":"2016","unstructured":"Zhizhong Li and Derek Hoiem. 2016. Learning Without Forgetting. In 14th European Conference, Amsterdam, The Netherlands, ECCV, Vol.\u00a09908. Springer, 614\u2013629."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"crossref","unstructured":"Julian\u00a0J. McAuley Christopher Targett Qinfeng Shi and Anton van\u00a0den Hengel. 2015. Image-Based Recommendations on Styles and Substitutes. In SIGIR. 43\u201352.","DOI":"10.1145\/2766462.2767755"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1009953814988"},{"key":"e_1_3_2_1_39_1","volume-title":"Focused Crawling for Structured Data. In The 23rd ACM International Conference on Information and Knowledge Management, CIKM. 1039\u20131048","author":"Meusel Robert","year":"2014","unstructured":"Robert Meusel, Peter Mika, and Roi Blanco. 2014. Focused Crawling for Structured Data. In The 23rd ACM International Conference on Information and Knowledge Management, CIKM. 1039\u20131048."},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-021-06003-9"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"crossref","unstructured":"Kien Pham A\u00e9cio S.\u00a0R. Santos and Juliana Freire. 2019. Bootstrapping Domain-Specific Content Discovery on the Web. In WWW. ACM 1476\u20131486.","DOI":"10.1145\/3308558.3313709"},{"key":"e_1_3_2_1_43_1","volume-title":"PMLR","author":"Raj Anant","year":"2022","unstructured":"Anant Raj and Francis\u00a0R. Bach. 2022. Convergence of Uncertainty Sampling for Active Learning. In ICML, Vol.\u00a0162. PMLR, 18310\u201318331."},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"crossref","unstructured":"Robin Rombach Andreas Blattmann Dominik Lorenz Patrick Esser and Bj\u00f6rn Ommer. 2022. High-Resolution Image Synthesis with Latent Diffusion Models. In CVPR. 10674\u201310685.","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"e_1_3_2_1_45_1","volume-title":"8th International Conference on Learning Representations, ICLR.","author":"Rosenfeld S.","year":"2020","unstructured":"Jonathan\u00a0S. Rosenfeld, Amir Rosenfeld, Yonatan Belinkov, and Nir Shavit. 2020. A Constructive Prediction of the Generalization Error Across Scales. In 8th International Conference on Learning Representations, ICLR."},{"key":"e_1_3_2_1_46_1","unstructured":"Nicholas Roy and Andrew McCallum. 2001. Toward Optimal Active Learning through Sampling Estimation of Error Reduction. In ICML. 441\u2013448."},{"key":"e_1_3_2_1_47_1","volume-title":"Deep Semi-Supervised Anomaly Detection. In 8th International Conference on Learning Representations, ICLR.","author":"Ruff Lukas","year":"2020","unstructured":"Lukas Ruff, Robert\u00a0A. Vandermeulen, Nico G\u00f6rnitz, Alexander Binder, Emmanuel M\u00fcller, Klaus-Robert M\u00fcller, and Marius Kloft. 2020. Deep Semi-Supervised Anomaly Detection. In 8th International Conference on Learning Representations, ICLR."},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"e_1_3_2_1_49_1","volume-title":"CLEAR: A Fully User-side Image Search System. In The 31st ACM International Conference on Information and Knowledge Management, CIKM.","author":"Sato Ryoma","year":"2022","unstructured":"Ryoma Sato. 2022. CLEAR: A Fully User-side Image Search System. In The 31st ACM International Conference on Information and Knowledge Management, CIKM."},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611977172.62"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"crossref","unstructured":"Ryoma Sato. 2022. Retrieving Black-box Optimal Images from External Databases. In WSDM. ACM 879\u2013887.","DOI":"10.1145\/3488560.3498462"},{"key":"e_1_3_2_1_52_1","volume-title":"Towards Principled User-side Recommender Systems. In The 31st ACM International Conference on Information and Knowledge Management, CIKM.","author":"Sato Ryoma","year":"2022","unstructured":"Ryoma Sato. 2022. Towards Principled User-side Recommender Systems. In The 31st ACM International Conference on Information and Knowledge Management, CIKM."},{"key":"e_1_3_2_1_53_1","volume-title":"Active Learning for Convolutional Neural Networks: A Core-Set Approach. In 6th International Conference on Learning Representations, ICLR.","author":"Sener Ozan","year":"2018","unstructured":"Ozan Sener and Silvio Savarese. 2018. Active Learning for Convolutional Neural Networks: A Core-Set Approach. In 6th International Conference on Learning Representations, ICLR."},{"key":"e_1_3_2_1_54_1","unstructured":"Burr Settles. 2009. Active learning literature survey. (2009)."},{"volume-title":"NeurIPS. Curran Associates","author":"Settles Burr","key":"e_1_3_2_1_55_1","unstructured":"Burr Settles, Mark Craven, and Soumya Ray. 2007. Multiple-Instance Active Learning. In NeurIPS. Curran Associates, Inc., 1289\u20131296."},{"key":"e_1_3_2_1_56_1","volume-title":"Deep Active Learning: Unified and Principled Method for Query and Training. In The 23rd International Conference on Artificial Intelligence and Statistics, AISTATS, Vol.\u00a0108","author":"Shui Changjian","year":"2020","unstructured":"Changjian Shui, Fan Zhou, Christian Gagn\u00e9, and Boyu Wang. 2020. Deep Active Learning: Unified and Principled Method for Query and Training. In The 23rd International Conference on Artificial Intelligence and Statistics, AISTATS, Vol.\u00a0108. PMLR, 1308\u20131318."},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"crossref","unstructured":"Hyun\u00a0Oh Song Yu Xiang Stefanie Jegelka and Silvio Savarese. 2016. Deep Metric Learning via Lifted Structured Feature Embedding. In CVPR. 4004\u20134012.","DOI":"10.1109\/CVPR.2016.434"},{"key":"e_1_3_2_1_58_1","first-page":"45","article-title":"Support Vector Machine Active Learning with Applications to Text Classification","volume":"2","author":"Tong Simon","year":"2001","unstructured":"Simon Tong and Daphne Koller. 2001. Support Vector Machine Active Learning with Applications to Text Classification. J. Mach. Learn. Res. 2 (2001), 45\u201366.","journal-title":"J. Mach. Learn. Res."},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2016.2589879"},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"crossref","unstructured":"Yue Wu Yinpeng Chen Lijuan Wang Yuancheng Ye Zicheng Liu Yandong Guo and Yun Fu. 2019. Large Scale Incremental Learning. In CVPR. 374\u2013382.","DOI":"10.1109\/CVPR.2019.00046"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"crossref","unstructured":"Qihang Yu Lingxi Xie Yan Wang Yuyin Zhou Elliot\u00a0K. Fishman and Alan\u00a0L. Yuille. 2018. Recurrent Saliency Transformation Network: Incorporating Multi-Stage Visual Cues for Small Organ Segmentation. In CVPR. 8280\u20138289.","DOI":"10.1109\/CVPR.2018.00864"},{"key":"e_1_3_2_1_62_1","unstructured":"Friedemann Zenke Ben Poole and Surya Ganguli. 2017. Continual Learning Through Synaptic Intelligence. In ICML Vol.\u00a070. PMLR 3987\u20133995."},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"crossref","unstructured":"Xiaohua Zhai Alexander Kolesnikov Neil Houlsby and Lucas Beyer. 2022. Scaling Vision Transformers. In CVPR. 1204\u20131213.","DOI":"10.1109\/CVPR52688.2022.01179"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1145\/3459637.3482427"},{"key":"e_1_3_2_1_65_1","volume-title":"Generative Adversarial Active Learning. arXiv abs\/1702.07956","author":"Zhu Jia-Jie","year":"2017","unstructured":"Jia-Jie Zhu and Jos\u00e9 Bento. 2017. Generative Adversarial Active Learning. arXiv abs\/1702.07956 (2017)."},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2012.2236570"}],"event":{"name":"WWW '23: The ACM Web Conference 2023","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"],"location":"Austin TX USA","acronym":"WWW '23"},"container-title":["Proceedings of the ACM Web Conference 2023"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3543507.3583346","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3543507.3583346","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:37:23Z","timestamp":1750178243000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3543507.3583346"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,4,30]]},"references-count":66,"alternative-id":["10.1145\/3543507.3583346","10.1145\/3543507"],"URL":"https:\/\/doi.org\/10.1145\/3543507.3583346","relation":{},"subject":[],"published":{"date-parts":[[2023,4,30]]},"assertion":[{"value":"2023-04-30","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}