{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T09:57:21Z","timestamp":1773482241608,"version":"3.50.1"},"reference-count":44,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,11,28]],"date-time":"2025-11-28T00:00:00Z","timestamp":1764288000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,11,28]],"date-time":"2025-11-28T00:00:00Z","timestamp":1764288000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1007\/s41060-025-00949-y","type":"journal-article","created":{"date-parts":[[2025,11,28]],"date-time":"2025-11-28T07:02:40Z","timestamp":1764313360000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Random feature embeddings give strong baselines for extreme multi-label text classification"],"prefix":"10.1007","volume":"21","author":[{"given":"Asha","family":"Rani","sequence":"first","affiliation":[]},{"given":"Rudra","family":"Dutt","sequence":"additional","affiliation":[]},{"given":"Yashaswi","family":"Verma","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,11,28]]},"reference":[{"key":"949_CR1","doi-asserted-by":"crossref","unstructured":"Agrawal, R., Gupta, A., Prabhu, Y., Varma, M.: Multi-label learning with millions of labels: Recommending advertiser bid phrases for web pages. In: International Conference on World Wide Web, pp. 13\u201324 (2013)","DOI":"10.1145\/2488388.2488391"},{"key":"949_CR2","doi-asserted-by":"crossref","unstructured":"Prabhu, Y., Varma, M.: FastXML: A fast, accurate and stable tree-classifier for extreme multi-label learning. In: ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 263\u2013272 (2014)","DOI":"10.1145\/2623330.2623651"},{"key":"949_CR3","doi-asserted-by":"crossref","unstructured":"Guillaumin, M., Mensink, T., Verbeek, J.J., Schmid, C.: Tagprop: Discriminative metric learning in nearest neighbor models for image auto-annotation. In: IEEE International Conference on Computer Vision, pp. 309\u2013316 (2009)","DOI":"10.1109\/ICCV.2009.5459266"},{"key":"949_CR4","doi-asserted-by":"crossref","unstructured":"Jain, H., Prabhu, Y., Varma, M.: Extreme multi-label loss functions for recommendation, tagging, ranking & other missing label applications. In: ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 935\u2013944 (2016)","DOI":"10.1145\/2939672.2939756"},{"key":"949_CR5","doi-asserted-by":"crossref","unstructured":"Prabhu, Y., Kag, A., Gopinath, S., Dahiya, K., Harsola, S., Agrawal, R., Varma, M.: Extreme multi-label learning with label features for warm-start tagging, ranking & recommendation. In: ACM International Conference on Web Search and Data Mining (2018)","DOI":"10.1145\/3159652.3159660"},{"key":"949_CR6","doi-asserted-by":"crossref","unstructured":"Prabhu, Y., Kag, A., Harsola, S., Agrawal, R., Varma, M.: Parabel: Partitioned label trees for extreme classification with application to dynamic search advertising. In: Proceedings of the International World Wide Web Conference (2018)","DOI":"10.1145\/3178876.3185998"},{"key":"949_CR7","unstructured":"Bhatia, K., Jain, H., Kar, P., Varma, M., Jain, P.: Sparse local embeddings for extreme multi-label classification. In: Neural Information Processing Systems, pp. 730\u2013738 (2015)"},{"key":"949_CR8","unstructured":"Yu, H.-F., Jain, P., Kar, P., Dhillon, I.S.: Large-scale multi-label learning with missing labels. In: International Conference on Machine Learning, vol. 32, pp. 593\u2013601 (2014)"},{"key":"949_CR9","doi-asserted-by":"crossref","unstructured":"Babbar, R., Sch\u00f6lkopf, B.: DiSMEC: Distributed sparse machines for extreme multi-label classification. In: ACM International Conference on Web Search and Data Mining, pp. 721\u2013729 (2017)","DOI":"10.1145\/3018661.3018741"},{"key":"949_CR10","unstructured":"Yen, I.E.-H., Huang, X., Ravikumar, P., Zhong, K., Dhillon, I.S.: PD-Sparse : A primal and dual sparse approach to extreme multiclass and multilabel classification. In: International Conference on Machine Learning, vol. 48, pp. 3069\u20133077 (2016)"},{"key":"949_CR11","doi-asserted-by":"crossref","unstructured":"Yen, I.E.-H., Huang, X., Dai, W., Ravikumar, P., Dhillon, I.S., Xing, E.P.: Ppdsparse: A parallel primal-dual sparse method for extreme classification. In: ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 545\u2013553 (2017)","DOI":"10.1145\/3097983.3098083"},{"key":"949_CR12","doi-asserted-by":"crossref","unstructured":"Tagami, Y.: AnnexML: Approximate nearest neighbor search for extreme multi-label classification. In: ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 455\u2013464 (2017)","DOI":"10.1145\/3097983.3097987"},{"key":"949_CR13","doi-asserted-by":"crossref","unstructured":"Liu, J., Chang, W.-C., Wu, Y., Yang, Y.: Deep learning for extreme multi-label text classification. In: Proceedings of the 40th International ACM SIGIR Conference on Research and Development in Information Retrieval (2017)","DOI":"10.1145\/3077136.3080834"},{"key":"949_CR14","doi-asserted-by":"crossref","unstructured":"Zhang, W., Yan, J., Wang, X., Zha, H.: Deep extreme multi-label learning. In: Proceedings of the International Conference on Multimedia Retrieval (2018)","DOI":"10.1145\/3206025.3206030"},{"issue":"11","key":"949_CR15","doi-asserted-by":"publisher","first-page":"2099","DOI":"10.1007\/s10994-020-05888-2","volume":"109","author":"S Khandagale","year":"2020","unstructured":"Khandagale, S., Xiao, H., Babbar, R.: Bonsai: diverse and shallow trees for extreme multi-label classification. Mach. Learn. 109(11), 2099\u20132119 (2020)","journal-title":"Mach. Learn."},{"key":"949_CR16","doi-asserted-by":"crossref","unstructured":"Chang, W., Yu, H., Zhong, K., Yang, Y., Dhillon, I.S.: Taming pretrained transformers for extreme multi-label text classification. In: SIGKDD Conference on Knowledge Discovery and Data Mining, pp. 3163\u20133171 (2020)","DOI":"10.1145\/3394486.3403368"},{"key":"949_CR17","unstructured":"You, R., Zhang, Z., Wang, Z., Dai, S., Mamitsuka, H., Zhu, S.: Attentionxml: Label tree-based attention-aware deep model for high-performance extreme multi-label text classification. In: Advances in Neural Information Processing Systems, pp. 5812\u20135822 (2019)"},{"key":"949_CR18","doi-asserted-by":"crossref","unstructured":"Dahiya, K., Saini, D., Mittal, A., Shaw, A., Dave, K., Soni, A., Jain, H., Agarwal, S., Varma, M.: Deepxml: A deep extreme multi-label learning framework applied to short text documents. In: International Conference on Web Search and Data Mining, pp. 31\u201339 (2021)","DOI":"10.1145\/3437963.3441810"},{"key":"949_CR19","unstructured":"Ye, H., Chen, Z., Wang, D., Davison, B.D.: Pretrained generalized autoregressive model with adaptive probabilistic label clusters for extreme multi-label text classification. In: International Conference on Machine Learning, vol. 119, pp. 10809\u201310819 (2020)"},{"key":"949_CR20","unstructured":"Jain, V., Prakash, J., Saini, D., Jiao, J., Ramjee, R., Varma, M.: Renee: End-to-end training of extreme classification models. In: Proceedings of Machine Learning and Systems (2023)"},{"key":"949_CR21","doi-asserted-by":"publisher","first-page":"189","DOI":"10.1090\/conm\/026\/737400","volume":"26","author":"WB Johnson","year":"1984","unstructured":"Johnson, W.B., Lindenstrauss, J.: Extensions of Lipschitz mappings into a Hilbert space. Contemp. Math. 26, 189\u2013206 (1984)","journal-title":"Contemp. Math."},{"key":"949_CR22","doi-asserted-by":"crossref","unstructured":"Verma, Y.: Surprising effectiveness of random feature embeddings in extreme classification. In: International Conference on Pattern Recognition, pp. 1836\u20131842 (2022)","DOI":"10.1109\/ICPR56361.2022.9956663"},{"key":"949_CR23","doi-asserted-by":"crossref","unstructured":"Xu, C., Tao, D., Xu, C.: Robust extreme multi-label learning. In: ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 1275\u20131284 (2016)","DOI":"10.1145\/2939672.2939798"},{"issue":"8\u20139","key":"949_CR24","doi-asserted-by":"publisher","first-page":"1329","DOI":"10.1007\/s10994-019-05791-5","volume":"108","author":"R Babbar","year":"2019","unstructured":"Babbar, R., Sch\u00f6lkopf, B.: Data scarcity, robustness and extreme multi-label classification. Mach. Learn. 108(8\u20139), 1329\u20131351 (2019)","journal-title":"Mach. Learn."},{"key":"949_CR25","unstructured":"Weston, J., Makadia, A., Yee, H.: Label partitioning for sublinear ranking. In: International Conference on Machine Learning (2013)"},{"key":"949_CR26","unstructured":"Siblini, W., Meyer, F., Kuntz, P.: CRAFTML: An efficient clustering-based random forest for extreme multi-label learning. In: Dy, J.G., Krause, A. (eds.) International Conference on Machine Learning (2018)"},{"key":"949_CR27","doi-asserted-by":"crossref","unstructured":"Jain, H., Balasubramanian, V., Chunduri, B., Varma, M.: Slice: Scalable linear extreme classifiers trained on 100 million labels for related searches. In: International Conference on Web Search and Data Mining, pp. 528\u2013536 (2019)","DOI":"10.1145\/3289600.3290979"},{"key":"949_CR28","unstructured":"Kharbanda, S., Banerjee, A., Schultheis, E., Babbar, R.: CascadeXML: Rethinking transformers for end-to-end multi-resolution training in extreme multi-label classification. In: Advances in Neural Information Processing Systems (2022)"},{"key":"949_CR29","doi-asserted-by":"crossref","unstructured":"Jalan, A., Kar, P.: Accelerating extreme classification via adaptive feature agglomeration. In: International Joint Conference on Artificial Intelligence (2019)","DOI":"10.24963\/ijcai.2019\/361"},{"key":"949_CR30","unstructured":"Jasinska, K., Dembczynski, K., Busa-Fekete, R., Pfannschmidt, K., Klerx, T., H\u00fcllermeier, E.: Extreme F-measure maximization using sparse probability estimates. In: International Conference on Machine Learning (2016)"},{"key":"949_CR31","unstructured":"Yang, Z., Dai, Z., Yang, Y., Carbonell, J., Salakhutdinov, R.R., Le, Q.V.: XLNet: Generalized autoregressive pretraining for language understanding. In: Advances in Neural Information Processing Systems (2019)"},{"key":"949_CR32","doi-asserted-by":"crossref","unstructured":"Devlin, J., Chang, M.-W., Lee, K., Toutanova, K.: BERT: Pre-training of deep bidirectional transformers for language understanding. In: NAACL, pp. 4171\u20134186 (2019)","DOI":"10.18653\/v1\/N19-1423"},{"key":"949_CR33","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-21606-5","volume-title":"The Elements of Statistical Learning","author":"T Hastie","year":"2001","unstructured":"Hastie, T., Tibshirani, R., Friedman, J.: The Elements of Statistical Learning. Springer Series in Statistics. Springer, New York, NY, USA (2001)"},{"issue":"5","key":"949_CR34","doi-asserted-by":"publisher","first-page":"2580","DOI":"10.1137\/100804139","volume":"33","author":"N Halko","year":"2011","unstructured":"Halko, N., Martinsson, P.-G., Shkolnisky, Y., Tygert, M.: An algorithm for the principal component analysis of large data sets. SIAM J. Scientific Computing 33(5), 2580\u20132594 (2011)","journal-title":"SIAM J. Scientific Computing"},{"key":"949_CR35","doi-asserted-by":"crossref","unstructured":"Yu, W., Gu, Y., Li, J., Liu, S., Li, Y.: Single-pass PCA of large high-dimensional data. CoRR abs\/1704.07669 (2017)","DOI":"10.24963\/ijcai.2017\/468"},{"key":"949_CR36","unstructured":"Fern, X.Z., Brodley, C.E.: Random projection for high dimensional data clustering: A cluster ensemble approach. In: International Conference on Machine Learning, pp. 186\u2013193 (2003)"},{"key":"949_CR37","unstructured":"Dasgupta, S.: Experiments with random projection. In: Uncertainty in Artificial Intelligence, pp. 143\u2013151 (2000)"},{"key":"949_CR38","unstructured":"Lecture 6 (CPSC 536N: Randomized Algorithms; 2011-12 Term 2. https:\/\/www.cs.ubc.ca\/~nickhar\/W12\/Lecture6Notes.pdf. Accessed: 2019-09-01"},{"key":"949_CR39","doi-asserted-by":"crossref","unstructured":"Perronnin, F., S\u00e1nchez, J., Mensink, T.: Improving the fisher kernel for large-scale image classification. In: European Conference on Computer Vision (2010)","DOI":"10.1007\/978-3-642-15561-1_11"},{"key":"949_CR40","unstructured":"Jayaram\u00a0Subramanya, S., Devvrit, F., Simhadri, H.V., Krishnawamy, R., Kadekodi, R.: DiskANN: Fast accurate billion-point nearest neighbor search on a single node. In: Advances in Neural Information Processing Systems (2019)"},{"key":"949_CR41","doi-asserted-by":"crossref","unstructured":"Feng, S.L., Manmatha, R., Lavrenko, V.: Multiple bernoulli relevance models for image and video annotation. In: Proc. CVPR, pp. 1002\u20131009 (2004)","DOI":"10.1109\/CVPR.2004.1315274"},{"key":"949_CR42","doi-asserted-by":"publisher","first-page":"126","DOI":"10.1007\/s11263-016-0927-0","volume":"121","author":"Y Verma","year":"2017","unstructured":"Verma, Y., Jawahar, C.V.: Image annotation by propagating labels from semantic neighbourhoods. Int. J. Comput. Vision 121, 126\u2013148 (2017)","journal-title":"Int. J. Comput. Vision"},{"key":"949_CR43","unstructured":"Bhatia, K., Jain, H., Prabhu, Y., Varma, M.: The Extreme Classification Repository (2016). http:\/\/manikvarma.github.io\/downloads\/XC\/XMLRepository.html"},{"key":"949_CR44","unstructured":"Wydmuch, M., Jasinska, K., Kuznetsov, M., Busa-Fekete, R., Dembczynski, K.: A no-regret generalization of hierarchical softmax to extreme multi-label classification. In: Advances in Neural Information Processing Systems (2018)"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-025-00949-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41060-025-00949-y","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-025-00949-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T09:37:01Z","timestamp":1773481021000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41060-025-00949-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,28]]},"references-count":44,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,6]]}},"alternative-id":["949"],"URL":"https:\/\/doi.org\/10.1007\/s41060-025-00949-y","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"value":"2364-415X","type":"print"},{"value":"2364-4168","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,11,28]]},"assertion":[{"value":"19 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 August 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 November 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest except IIT Jodhpur (.iitj.ac.in).","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"This work does not involve any human or animal subjects; hence, no ethics approval\/consent is required.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}}],"article-number":"27"}}