{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T08:54:32Z","timestamp":1775638472978,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":58,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,3,8]],"date-time":"2021-03-08T00:00:00Z","timestamp":1615161600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,3,8]]},"DOI":"10.1145\/3437963.3441810","type":"proceedings-article","created":{"date-parts":[[2021,3,6]],"date-time":"2021-03-06T04:34:28Z","timestamp":1615005268000},"page":"31-39","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":51,"title":["DeepXML: A Deep Extreme Multi-Label Learning Framework Applied to Short Text Documents"],"prefix":"10.1145","author":[{"given":"Kunal","family":"Dahiya","sequence":"first","affiliation":[{"name":"IIT Delhi, Delhi, India"}]},{"given":"Deepak","family":"Saini","sequence":"additional","affiliation":[{"name":"Microsoft Research, Bengaluru, India"}]},{"given":"Anshul","family":"Mittal","sequence":"additional","affiliation":[{"name":"IIT Delhi, Delhi, India"}]},{"given":"Ankush","family":"Shaw","sequence":"additional","affiliation":[{"name":"IIT Delhi, Delhi, India"}]},{"given":"Kushal","family":"Dave","sequence":"additional","affiliation":[{"name":"Microsoft, Sunnyvale, CA, USA"}]},{"given":"Akshay","family":"Soni","sequence":"additional","affiliation":[{"name":"Microsoft, Sunnyvale, CA, USA"}]},{"given":"Himanshu","family":"Jain","sequence":"additional","affiliation":[{"name":"IIT Delhi, Delhi, India"}]},{"given":"Sumeet","family":"Agarwal","sequence":"additional","affiliation":[{"name":"IIT Delhi, Delhi, India"}]},{"given":"Manik","family":"Varma","sequence":"additional","affiliation":[{"name":"Microsoft Research &amp; IIT Delhi, Bengaluru, India"}]}],"member":"320","published-online":{"date-parts":[[2021,3,8]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","unstructured":"R. Agrawal A. Gupta Y. Prabhu and M. Varma. 2013. Multi-label learning with millions of labels: Recommending advertiser bid phrases for web pages. In WWW.  R. Agrawal A. Gupta Y. Prabhu and M. Varma. 2013. Multi-label learning with millions of labels: Recommending advertiser bid phrases for web pages. In WWW.","DOI":"10.1145\/2488388.2488391"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","unstructured":"R. Babbar and B. Sch\u00f6lkopf. 2017. DiSMEC: Distributed Sparse Machines for Extreme Multi-label Classification. In WSDM.  R. Babbar and B. Sch\u00f6lkopf. 2017. DiSMEC: Distributed Sparse Machines for Extreme Multi-label Classification. In WSDM.","DOI":"10.1145\/3018661.3018741"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","unstructured":"R. Babbar and B. Sch\u00f6lkopf. 2019. Data scarcity robustness and extreme multi-label classification. ML (2019).  R. Babbar and B. Sch\u00f6lkopf. 2019. Data scarcity robustness and extreme multi-label classification. ML (2019).","DOI":"10.1007\/s10994-019-05791-5"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"crossref","unstructured":"X. Bai E. Ordentlich Y. Zhang A. Feng A. Ratnaparkhi R. Somvanshi and A. Tjahjadi. 2018. Scalable Query N-Gram Embedding for Improving Matching and Relevance in Sponsored Search. In KDD.  X. Bai E. Ordentlich Y. Zhang A. Feng A. Ratnaparkhi R. Somvanshi and A. Tjahjadi. 2018. Scalable Query N-Gram Embedding for Improving Matching and Relevance in Sponsored Search. In KDD.","DOI":"10.1145\/3219819.3219897"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"E. J. Barezi I. D. W. P. Fung and H. R. Rabiee. 2019. A Submodular Feature-Aware Framework for Label Subset Selection in Extreme Classification Problems. In NAACL.  E. J. Barezi I. D. W. P. Fung and H. R. Rabiee. 2019. A Submodular Feature-Aware Framework for Label Subset Selection in Extreme Classification Problems. In NAACL.","DOI":"10.18653\/v1\/N19-1106"},{"key":"e_1_3_2_1_6_1","unstructured":"K. Bhatia K. Dahiya H. Jain A. Mittal Y. Prabhu and M. Varma. 2016. The Extreme Classification Repository: Multi-label Datasets & Code. http:\/\/manikvarma.org\/downloads\/XC\/XMLRepository.html  K. Bhatia K. Dahiya H. Jain A. Mittal Y. Prabhu and M. Varma. 2016. The Extreme Classification Repository: Multi-label Datasets & Code. http:\/\/manikvarma.org\/downloads\/XC\/XMLRepository.html"},{"key":"e_1_3_2_1_7_1","unstructured":"K. Bhatia H. Jain P. Kar M. Varma and P. Jain. 2015. Sparse Local Embeddings for Extreme Multi-label Classification. In NeurIPS.  K. Bhatia H. Jain P. Kar M. Varma and P. Jain. 2015. Sparse Local Embeddings for Extreme Multi-label Classification. In NeurIPS."},{"key":"e_1_3_2_1_8_1","volume":"201","author":"Bi W.","unstructured":"W. Bi and J. Kwok. 201 3. Efficient multi-label classification with many labels. In ICML. W. Bi and J. Kwok. 2013. Efficient multi-label classification with many labels. In ICML.","journal-title":"J. Kwok."},{"key":"e_1_3_2_1_9_1","volume":"200","author":"Broder A.","unstructured":"A. Broder , P. Ciccolo , E. Gabrilovich , V. Josifovski , D. Metzler , L. Riedel , and J. Yuan. 200 9. Online Expansion of Rare Queries for Sponsored Search. In WWW. A. Broder, P. Ciccolo, E. Gabrilovich, V. Josifovski, D. Metzler, L. Riedel, and J. Yuan. 2009. Online Expansion of Rare Queries for Sponsored Search. In WWW.","journal-title":"J. Yuan."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"crossref","unstructured":"I. Chalkidis M. Fergadiotis P. Malakasiotis N. Aletras and I. Androutsopoulos. 2019. Extreme Multi-Label Legal Text Classification: A case study in EU Legislation. In NAACL.  I. Chalkidis M. Fergadiotis P. Malakasiotis N. Aletras and I. Androutsopoulos. 2019. Extreme Multi-Label Legal Text Classification: A case study in EU Legislation. In NAACL.","DOI":"10.18653\/v1\/W19-2209"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","unstructured":"W.-C. Chang Yu H.-F. K. Zhong Y. Yang and I.-S. Dhillon. 2020 a. Taming Pretrained Transformers for Extreme Multi-label Text Classification. In KDD.  W.-C. Chang Yu H.-F. K. Zhong Y. Yang and I.-S. Dhillon. 2020 a. Taming Pretrained Transformers for Extreme Multi-label Text Classification. In KDD.","DOI":"10.1145\/3394486.3403368"},{"key":"e_1_3_2_1_12_1","unstructured":"W-C. Chang F.-X. Yu Y.-W. Chang Y. Yang and S. Kumar. 2020 b. Pre-training Tasks for Embedding-based Large-scale Retrieval. In ICLR.  W-C. Chang F.-X. Yu Y.-W. Chang Y. Yang and S. Kumar. 2020 b. Pre-training Tasks for Embedding-based Large-scale Retrieval. In ICLR."},{"key":"e_1_3_2_1_13_1","volume-title":"BERT: Pre-training of deep bidirectional transformers for language understanding. NAACL","author":"Devlin J.","year":"2019","unstructured":"J. Devlin , M. W. Chang , K. Lee , and K. Toutanova . 2019 . BERT: Pre-training of deep bidirectional transformers for language understanding. NAACL (2019). J. Devlin, M. W. Chang, K. Lee, and K. Toutanova. 2019. BERT: Pre-training of deep bidirectional transformers for language understanding. NAACL (2019)."},{"key":"e_1_3_2_1_14_1","unstructured":"J. Gao S. Xie X. He and A. Ali. 2012. Learning Lexicon Models from Search Logs for Query Expansion. In EMNLP.  J. Gao S. Xie X. He and A. Ali. 2012. Learning Lexicon Models from Search Logs for Query Expansion. In EMNLP."},{"key":"e_1_3_2_1_15_1","unstructured":"C. Guo A. Mousavi X. Wu D.-N. Holtmann-Rice S. Kale S. Reddi and S. Kumar. 2019. Breaking the Glass Ceiling for Embedding-Based Classifiers for Large Output Spaces. In NeurIPS.  C. Guo A. Mousavi X. Wu D.-N. Holtmann-Rice S. Kale S. Reddi and S. Kumar. 2019. Breaking the Glass Ceiling for Embedding-Based Classifiers for Large Output Spaces. In NeurIPS."},{"key":"e_1_3_2_1_16_1","volume":"201","author":"He K.","unstructured":"K. He , X. Zhang , S. Ren , and J. Sun. 201 6. Deep Residual Learning for Image Recognition. In CVPR. K. He, X. Zhang, S. Ren, and J. Sun. 2016. Deep Residual Learning for Image Recognition. In CVPR.","journal-title":"J. Sun."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"crossref","unstructured":"P. S. Huang X. He J. Gao L. Deng A. Acero and L. Heck. 2013. Learning Deep Structured Semantic Models for Web Search using Clickthrough Data. In CIKM.  P. S. Huang X. He J. Gao L. Deng A. Acero and L. Heck. 2013. Learning Deep Structured Semantic Models for Web Search using Clickthrough Data. In CIKM.","DOI":"10.1145\/2505515.2505665"},{"key":"e_1_3_2_1_18_1","unstructured":"A. Ioannis G. M. Hector and C. C. Chi. 2008. Simrank+: Query Rewriting through Link Analysis of the Click Graph. In WWW.  A. Ioannis G. M. Hector and C. C. Chi. 2008. Simrank+: Query Rewriting through Link Analysis of the Click Graph. In WWW."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3289600.3290979"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"crossref","unstructured":"H. Jain Y. Prabhu and M. Varma. 2016. Extreme Multi-label Loss Functions for Recommendation Tagging Ranking and Other Missing Label Applications. In KDD.  H. Jain Y. Prabhu and M. Varma. 2016. Extreme Multi-label Loss Functions for Recommendation Tagging Ranking and Other Missing Label Applications. In KDD.","DOI":"10.1145\/2939672.2939756"},{"key":"e_1_3_2_1_21_1","unstructured":"K. Jasinska K. Dembczynski R. Busa-Fekete K. Pfannschmidt T. Klerx and E. Hullermeier. 2016. Extreme F-measure Maximization using Sparse Probability Estimates. In ICML.  K. Jasinska K. Dembczynski R. Busa-Fekete K. Pfannschmidt T. Klerx and E. Hullermeier. 2016. Extreme F-measure Maximization using Sparse Probability Estimates. In ICML."},{"key":"e_1_3_2_1_22_1","unstructured":"Y. Jernite A. Choromanska and D. Sontag. 2017. Simultaneous Learning of Trees and Representations for Extreme Classification and Density Estimation. In ICML.  Y. Jernite A. Choromanska and D. Sontag. 2017. Simultaneous Learning of Trees and Representations for Extreme Classification and Density Estimation. In ICML."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"crossref","unstructured":"A. Joulin E. Grave P. Bojanowski and T. Mikolov. 2017. Bag of Tricks for Efficient Text Classification. In EACL.  A. Joulin E. Grave P. Bojanowski and T. Mikolov. 2017. Bag of Tricks for Efficient Text Classification. In EACL.","DOI":"10.18653\/v1\/E17-2068"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"crossref","unstructured":"S. Khandagale H. Xiao and R. Babbar. 2019. Bonsai - Diverse and Shallow Trees for Extreme Multi-label Classification. Machine Learning (2019).  S. Khandagale H. Xiao and R. Babbar. 2019. Bonsai - Diverse and Shallow Trees for Extreme Multi-label Classification. Machine Learning (2019).","DOI":"10.1007\/s10994-020-05888-2"},{"key":"e_1_3_2_1_25_1","volume":"201","author":"Krichene W.","unstructured":"W. Krichene , N. Mayoraz , S. Rendle , L. Zhang , X. Yi , L. Hong , E. Chi , and J. Anderson. 201 9. Efficient training on very large corpora via gramian estimation. In ICLR. W. Krichene, N. Mayoraz, S. Rendle, L. Zhang, X. Yi, L. Hong, E. Chi, and J. Anderson. 2019. Efficient training on very large corpora via gramian estimation. In ICLR.","journal-title":"J. Anderson."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"crossref","unstructured":"M. C. Lee B. Gao and R. Zhang. 2018. Rare Query Expansion Through Generative Adversarial Networks in Search Advertising. In KDD.  M. C. Lee B. Gao and R. Zhang. 2018. Rare Query Expansion Through Generative Adversarial Networks in Search Advertising. In KDD.","DOI":"10.1145\/3219819.3219850"},{"key":"e_1_3_2_1_27_1","unstructured":"Y. Lian Z. Chen J. Hu K. Zhang C. Yan M. Tong W. Han H. Guan Y. Li Y. Cao Y. Yu Z. Li X. Liu and Y. Wang. 2019. An end-to-end Generative Retrieval Method for Sponsored Search Engine -Decoding Efficiently into a Closed Target Domain. CoRR (2019).  Y. Lian Z. Chen J. Hu K. Zhang C. Yan M. Tong W. Han H. Guan Y. Li Y. Cao Y. Yu Z. Li X. Liu and Y. Wang. 2019. An end-to-end Generative Retrieval Method for Sponsored Search Engine -Decoding Efficiently into a Closed Target Domain. CoRR (2019)."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"crossref","unstructured":"J. Liu W. Chang Y. Wu and Y. Yang. 2017. Deep Learning for Extreme Multi-label Text Classification. In SIGIR.  J. Liu W. Chang Y. Wu and Y. Yang. 2017. Deep Learning for Extreme Multi-label Text Classification. In SIGIR.","DOI":"10.1145\/3077136.3080834"},{"key":"e_1_3_2_1_29_1","first-page":"i","volume":"2019","author":"Liu X.","unstructured":"X. Liu , P. He , W. Chen , and J. Gao. 2019 a. Mult i -Task Deep Neural Networks for Natural Language Understanding. In ACL. X. Liu, P. He, W. Chen, and J. Gao. 2019 a. Multi-Task Deep Neural Networks for Natural Language Understanding. In ACL.","journal-title":"J. Gao."},{"key":"e_1_3_2_1_30_1","volume-title":"2019 b. Roberta: A robustly optimized bert pretraining approach. CoRR","author":"Liu Y.","year":"2019","unstructured":"Y. Liu , M. Ott , N. Goyal , J. Du , M. Joshi , D. Chen , O. Levy , M. Lewis , L. Zettlemoyer , and V. Stoyanov . 2019 b. Roberta: A robustly optimized bert pretraining approach. CoRR ( 2019 ). Y. Liu, M. Ott, N. Goyal, J. Du, M. Joshi, D. Chen, O. Levy, M. Lewis, L. Zettlemoyer, and V. Stoyanov. 2019 b. Roberta: A robustly optimized bert pretraining approach. CoRR (2019)."},{"key":"e_1_3_2_1_31_1","unstructured":"A. Y. Malkov and D. A. Yashunin. 2016. Efficient and robust approximate nearest neighbor search using Hierarchical Navigable Small World graphs. CoRR (2016).  A. Y. Malkov and D. A. Yashunin. 2016. Efficient and robust approximate nearest neighbor search using Hierarchical Navigable Small World graphs. CoRR (2016)."},{"key":"e_1_3_2_1_32_1","unstructured":"T. K. R. Medini Q. Huang Y. Wang V. Mohan and A. Shrivastava. 2019. Extreme Classification in Log Memory using Count-Min Sketch: A Case Study of Amazon Search with 50M Products. In NeurIPS.  T. K. R. Medini Q. Huang Y. Wang V. Mohan and A. Shrivastava. 2019. Extreme Classification in Log Memory using Count-Min Sketch: A Case Study of Amazon Search with 50M Products. In NeurIPS."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"crossref","unstructured":"Q. Mei D. Zhou and K. Church. 2008. Query Suggestion Using Hitting Time. In CIKM.  Q. Mei D. Zhou and K. Church. 2008. Query Suggestion Using Hitting Time. In CIKM.","DOI":"10.1145\/1458082.1458145"},{"key":"e_1_3_2_1_34_1","volume":"201","author":"Mikolov T.","unstructured":"T. Mikolov , I. Sutskever , K. Chen , G. Corrado , and J. Dean. 201 3. Distributed Representations of Words and Phrases and Their Compositionality. In NeurIPS. T. Mikolov, I. Sutskever, K. Chen, G. Corrado, and J. Dean. 2013. Distributed Representations of Words and Phrases and Their Compositionality. In NeurIPS.","journal-title":"J. Dean."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"crossref","unstructured":"P. Mineiro and N. Karampatziakis. 2015. Fast Label Embeddings via Randomized Linear Algebra. In ECML\/PKDD.  P. Mineiro and N. Karampatziakis. 2015. Fast Label Embeddings via Randomized Linear Algebra. In ECML\/PKDD.","DOI":"10.1007\/978-3-319-23528-8_3"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"crossref","unstructured":"A. Mittal K. Dahiya S. Agrawal D. Saini S. Agarwal P. Kar and M. Varma. 2021 a. DECAF: Deep Extreme Classification with Label Features. In WSDM.  A. Mittal K. Dahiya S. Agrawal D. Saini S. Agarwal P. Kar and M. Varma. 2021 a. DECAF: Deep Extreme Classification with Label Features. In WSDM.","DOI":"10.1145\/3442381.3449815"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"crossref","unstructured":"A. Mittal N. Sachdeva S. Agrawal S. Agarwal P. Kar and M. Varma. 2021 b. ECLARE: Extreme Classification with Label Graph Correlations. In TheWebConf.  A. Mittal N. Sachdeva S. Agrawal S. Agarwal P. Kar and M. Varma. 2021 b. ECLARE: Extreme Classification with Label Graph Correlations. In TheWebConf.","DOI":"10.1145\/3442381.3449815"},{"key":"e_1_3_2_1_38_1","unstructured":"T. Miyato T. Kataoka M. Koyama and Y. Yoshida. 2018. Spectral Normalization for Generative Adversarial Networks. CoRR (2018).  T. Miyato T. Kataoka M. Koyama and Y. Yoshida. 2018. Spectral Normalization for Generative Adversarial Networks. CoRR (2018)."},{"key":"e_1_3_2_1_39_1","unstructured":"S. J. Pan and Q. Yang. 2010. A Survey on Transfer Learning. TKDE (2010).  S. J. Pan and Q. Yang. 2010. A Survey on Transfer Learning. TKDE (2010)."},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"crossref","unstructured":"Y. Prabhu A. Kag S. Gopinath K. Dahiya S. Harsola R. Agrawal and M. Varma. 2018a. Extreme multi-label learning with label features for warm-start tagging ranking and recommendation. In WSDM.  Y. Prabhu A. Kag S. Gopinath K. Dahiya S. Harsola R. Agrawal and M. Varma. 2018a. Extreme multi-label learning with label features for warm-start tagging ranking and recommendation. In WSDM.","DOI":"10.1145\/3159652.3159660"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1145\/3178876.3185998"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"crossref","unstructured":"Y. Prabhu and M. Varma. 2014. FastXML: A Fast Accurate and Stable Tree-classifier for eXtreme Multi-label Learning. In KDD.  Y. Prabhu and M. Varma. 2014. FastXML: A Fast Accurate and Stable Tree-classifier for eXtreme Multi-label Learning. In KDD.","DOI":"10.1145\/2623330.2623651"},{"key":"e_1_3_2_1_43_1","unstructured":"A. S Rawat J. J. Chen F. Yu Suresh A. .T and S. Kumar. 2019. Sampled softmax with random fourier features. In NeurIPS.  A. S Rawat J. J. Chen F. Yu Suresh A. .T and S. Kumar. 2019. Sampled softmax with random fourier features. In NeurIPS."},{"key":"e_1_3_2_1_44_1","volume-title":"Sentence-bert: Sentence embeddings using siamese bert-networks. EMNLP.","author":"Reimers N.","year":"2019","unstructured":"N. Reimers and I. Gurevych . 2019 . Sentence-bert: Sentence embeddings using siamese bert-networks. EMNLP. N. Reimers and I. Gurevych. 2019. Sentence-bert: Sentence embeddings using siamese bert-networks. EMNLP."},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"crossref","unstructured":"D. Saini A.K. Jain Kushal. Dave J. Jiao A. Singh R. Zhang and M. Varma. 2021. GalaXC: Graph neural networks with labelwise attention for extreme classification. In TheWebConf.  D. Saini A.K. Jain Kushal. Dave J. Jiao A. Singh R. Zhang and M. Varma. 2021. GalaXC: Graph neural networks with labelwise attention for extreme classification. In TheWebConf.","DOI":"10.1145\/3442381.3449937"},{"key":"e_1_3_2_1_46_1","unstructured":"W. Siblini P. Kuntz and F. Meyer. 2018. CRAFTML an Efficient Clustering-based Random Forest for Extreme Multi-label Learning. In ICML.  W. Siblini P. Kuntz and F. Meyer. 2018. CRAFTML an Efficient Clustering-based Random Forest for Extreme Multi-label Learning. In ICML."},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"crossref","unstructured":"Y. Tagami. 2017. AnnexML: Approximate Nearest Neighbor Search for Extreme Multi-label Classification. In KDD.  Y. Tagami. 2017. AnnexML: Approximate Nearest Neighbor Search for Extreme Multi-label Classification. In KDD.","DOI":"10.1145\/3097983.3097987"},{"key":"e_1_3_2_1_48_1","unstructured":"Y. X. Wang D. Ramanan and M. Hebert. 2017. Learning to Model the Tail. In NeurIPS.  Y. X. Wang D. Ramanan and M. Hebert. 2017. Learning to Model the Tail. In NeurIPS."},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"crossref","unstructured":"T. Wei W. W. Tu and Y. F. Li. 2019. Learning for Tail Label Data: A Label-Specific Feature Approach. In IJCAI.  T. Wei W. W. Tu and Y. F. Li. 2019. Learning for Tail Label Data: A Label-Specific Feature Approach. In IJCAI.","DOI":"10.24963\/ijcai.2019\/533"},{"key":"e_1_3_2_1_50_1","unstructured":"M. Wydmuch K. Jasinska M. Kuznetsov R. Busa-Fekete and K. Dembczynski. 2018. A no-regret generalization of hierarchical softmax to extreme multi-label classification. In NeurIPS.  M. Wydmuch K. Jasinska M. Kuznetsov R. Busa-Fekete and K. Dembczynski. 2018. A no-regret generalization of hierarchical softmax to extreme multi-label classification. In NeurIPS."},{"key":"e_1_3_2_1_51_1","unstructured":"H. Ye Z. Chen D.-H. Wang and B. D. Davison. 2020. Pretrained Generalized Autoregressive Model with Adaptive Probabilistic Label Clusters for Extreme Multi-label Text Classification. In ICML.  H. Ye Z. Chen D.-H. Wang and B. D. Davison. 2020. Pretrained Generalized Autoregressive Model with Adaptive Probabilistic Label Clusters for Extreme Multi-label Text Classification. In ICML."},{"key":"e_1_3_2_1_52_1","unstructured":"C. Yejin F. Marcus G. Evgeniy Vanja. J. M. Mauricio and P. Bo. 2010. Using Landing Pages for Sponsored Search Ad Selection. In WWW.  C. Yejin F. Marcus G. Evgeniy Vanja. J. M. Mauricio and P. Bo. 2010. Using Landing Pages for Sponsored Search Ad Selection. In WWW."},{"key":"e_1_3_2_1_53_1","unstructured":"E.H. I. Yen X. Huang K. Zhong P. Ravikumar and I. S. Dhillon. 2016. PD-Sparse: A Primal and Dual Sparse Approach to Extreme Multiclass and Multilabel Classification. In ICML.  E.H. I. Yen X. Huang K. Zhong P. Ravikumar and I. S. Dhillon. 2016. PD-Sparse: A Primal and Dual Sparse Approach to Extreme Multiclass and Multilabel Classification. In ICML."},{"key":"e_1_3_2_1_54_1","unstructured":"I. Yen S. Kale F. Yu D. Holtmann R. S. Kumar and P. Ravikumar. 2018. Loss Decomposition for Fast Learning in Large Output Spaces. In ICML.  I. Yen S. Kale F. Yu D. Holtmann R. S. Kumar and P. Ravikumar. 2018. Loss Decomposition for Fast Learning in Large Output Spaces. In ICML."},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"crossref","unstructured":"X. Yi J. Yang L. Hong D. Z. Cheng L. Heldt A. Kumthekar Z. Zhao L. Wei and E. Chi. 2019. Sampling-Bias-Corrected Neural Modeling for Large Corpus Item Recommendations. In RecSys.  X. Yi J. Yang L. Hong D. Z. Cheng L. Heldt A. Kumthekar Z. Zhao L. Wei and E. Chi. 2019. Sampling-Bias-Corrected Neural Modeling for Large Corpus Item Recommendations. In RecSys.","DOI":"10.1145\/3298689.3346996"},{"key":"e_1_3_2_1_56_1","unstructured":"R. You S. Dai Z. Zhang H. Mamitsuka and S. Zhu. 2019. AttentionXML: Extreme Multi-Label Text Classification with Multi-Label Attention Based Recurrent Neural Networks. In NeurIPS.  R. You S. Dai Z. Zhang H. Mamitsuka and S. Zhu. 2019. AttentionXML: Extreme Multi-Label Text Classification with Multi-Label Attention Based Recurrent Neural Networks. In NeurIPS."},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"crossref","unstructured":"Z. Yuan Z. Guo Yu X. X. Wang and T. Yang. 2020. Accelerating Deep Learning with Millions of Classes. In ECCV.  Z. Yuan Z. Guo Yu X. X. Wang and T. Yang. 2020. Accelerating Deep Learning with Millions of Classes. In ECCV.","DOI":"10.1007\/978-3-030-58592-1_42"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"crossref","unstructured":"H. Zhou M. Huang Y. Mao C. Zhu P. Shu and X. Zhu. 2019. Domain-Constrained Advertising Keyword Generation. In WWW.  H. Zhou M. Huang Y. Mao C. Zhu P. Shu and X. Zhu. 2019. Domain-Constrained Advertising Keyword Generation. In WWW.","DOI":"10.1145\/3308558.3313570"}],"event":{"name":"WSDM '21: The Fourteenth ACM International Conference on Web Search and Data Mining","location":"Virtual Event Israel","acronym":"WSDM '21","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGIR ACM Special Interest Group on Information Retrieval"]},"container-title":["Proceedings of the 14th ACM International Conference on Web Search and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3437963.3441810","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3437963.3441810","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:47:36Z","timestamp":1750193256000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3437963.3441810"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3,8]]},"references-count":58,"alternative-id":["10.1145\/3437963.3441810","10.1145\/3437963"],"URL":"https:\/\/doi.org\/10.1145\/3437963.3441810","relation":{},"subject":[],"published":{"date-parts":[[2021,3,8]]},"assertion":[{"value":"2021-03-08","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}