{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,8,4]],"date-time":"2024-08-04T00:05:37Z","timestamp":1722729937317},"reference-count":46,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2020,4,4]],"date-time":"2020-04-04T00:00:00Z","timestamp":1585958400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,4,4]],"date-time":"2020-04-04T00:00:00Z","timestamp":1585958400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2020,9]]},"DOI":"10.1007\/s41060-020-00209-1","type":"journal-article","created":{"date-parts":[[2020,4,4]],"date-time":"2020-04-04T05:32:54Z","timestamp":1585978374000},"page":"215-231","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Combining instance and feature neighbours for extreme multi-label classification"],"prefix":"10.1007","volume":"10","author":[{"given":"Len","family":"Feremans","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Boris","family":"Cule","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Celine","family":"Vens","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bart","family":"Goethals","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,4,4]]},"reference":[{"key":"209_CR1","doi-asserted-by":"crossref","unstructured":"Feremans, L., Cule, B., Vens, C., Goethals, B.: Combining instance and feature neighbors for efficient multi-label classification. In: 2017 IEEE International Conference on Data Science and Advanced Analytics (DSAA), pp. 109\u2013118. IEEE (2017)","DOI":"10.1109\/DSAA.2017.70"},{"issue":"3","key":"209_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.4018\/jdwm.2007070101","volume":"3","author":"G Tsoumakas","year":"2006","unstructured":"Tsoumakas, G., Katakis, I.: Multi-label classification: an overview. Int. J. Data Warehous. Min. 3(3), 1\u201313 (2006)","journal-title":"Int. J. Data Warehous. Min."},{"issue":"3","key":"209_CR3","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1007\/s10994-011-5256-5","volume":"85","author":"J Read","year":"2011","unstructured":"Read, J., Pfahringer, B., Holmes, G., Frank, E.: Classifier chains for multi-label classification. Mach. Learn. 85(3), 333\u2013359 (2011)","journal-title":"Mach. Learn."},{"issue":"3","key":"209_CR4","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1023\/A:1007614523901","volume":"37","author":"RE Schapire","year":"1999","unstructured":"Schapire, R.E., Singer, Y.: Improved boosting algorithms using confidence-rated predictions. Mach. Learn. 37(3), 297\u2013336 (1999)","journal-title":"Mach. Learn."},{"issue":"2","key":"209_CR5","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1007\/s10994-008-5077-3","volume":"73","author":"C Vens","year":"2008","unstructured":"Vens, C., Struyf, J., Schietgat, L., D\u017eeroski, S., Blockeel, H.: Decision trees for hierarchical multi-label classification. Mach. Learn. 73(2), 185\u2013214 (2008)","journal-title":"Mach. Learn."},{"key":"209_CR6","doi-asserted-by":"crossref","unstructured":"Elisseeff, A., Weston, J., et\u00a0al.: A kernel method for multi-labelled classification. In: NIPS, vol.\u00a014, pp. 681\u2013687 (2001)","DOI":"10.7551\/mitpress\/1120.003.0092"},{"issue":"7","key":"209_CR7","doi-asserted-by":"publisher","first-page":"2038","DOI":"10.1016\/j.patcog.2006.12.019","volume":"40","author":"M-L Zhang","year":"2007","unstructured":"Zhang, M.-L., Zhou, Z.-H.: Ml-knn: a lazy learning approach to multi-label learning. Pattern Recognit. 40(7), 2038\u20132048 (2007)","journal-title":"Pattern Recognit."},{"issue":"6","key":"209_CR8","doi-asserted-by":"publisher","first-page":"411","DOI":"10.1002\/widm.1139","volume":"4","author":"E Gibaja","year":"2014","unstructured":"Gibaja, E., Ventura, S.: Multi-label learning: a review of the state of the art and ongoing research. Wiley Interdiscip. Rev. Data Min. Knowl. Discov. 4(6), 411\u2013444 (2014)","journal-title":"Wiley Interdiscip. Rev. Data Min. Knowl. Discov."},{"key":"209_CR9","unstructured":"Bhatia, K., Jain, H., Kar, P., Varma, M., Jain, P.: Sparse local embeddings for extreme multi-label classification. In: Advances in Neural Information Processing Systems, pp. 730\u2013738 (2015)"},{"key":"209_CR10","doi-asserted-by":"crossref","unstructured":"Tagami, Y.: Annexml: approximate nearest neighbor search for extreme multi-label classification. In: Proceedings of the 23rd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 455\u2013464. ACM (2017)","DOI":"10.1145\/3097983.3097987"},{"key":"209_CR11","doi-asserted-by":"crossref","unstructured":"Prabhu, Y., Varma, M.: Fastxml: a fast, accurate and stable tree-classifier for extreme multi-label learning. In: Proceedings of the 20th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 263\u2013272. ACM (2014)","DOI":"10.1145\/2623330.2623651"},{"key":"209_CR12","doi-asserted-by":"crossref","unstructured":"Resnick, P., Iacovou, N., Suchak, M., Bergstrom, P., Riedl, J.: Grouplens: an open architecture for collaborative filtering of netnews. In: Proceedings of the 1994 ACM Conference on Computer Supported Cooperative Work, pp. 175\u2013186. ACM (1994)","DOI":"10.1145\/192844.192905"},{"key":"209_CR13","unstructured":"Breese, J.S., Heckerman, D., Kadie, C.: Empirical analysis of predictive algorithms for collaborative filtering. In: Proceedings of the Fourteenth Conference on Uncertainty in Artificial Intelligence, pp. 43\u201352. Morgan Kaufmann Publishers Inc. (1998)"},{"key":"209_CR14","doi-asserted-by":"crossref","unstructured":"Sarwar, B., Karypis, G., Konstan, J., Riedl, J.: Item-based collaborative filtering recommendation algorithms. In: Proceedings of the 10th International Conference on World Wide Web, pp. 285\u2013295. ACM (2001)","DOI":"10.1145\/371920.372071"},{"key":"209_CR15","doi-asserted-by":"crossref","unstructured":"Bayardo, R.J., Ma, Y., Srikant, R.: Scaling up all pairs similarity search. In: Proceedings of the 16th International Conference on World Wide Web, pp. 131\u2013140. ACM (2007)","DOI":"10.1145\/1242572.1242591"},{"key":"209_CR16","unstructured":"Awekar, A., Samatova, N.F.: Fast matching for all pairs similarity search. In: IEEE\/WIC\/ACM International Joint Conferences on Web Intelligence and Intelligent Agent Technologies, 2009. WI-IAT\u201909, vol. 1, pp. 295\u2013300. IEEE (2009)"},{"key":"209_CR17","unstructured":"Xiao, C., Wang, W., Lin, X., Shang, H.: Top-k set similarity joins. In: IEEE 25th International Conference on Data Engineering, 2009. ICDE\u201909, pp. 916\u2013927. IEEE (2009)"},{"key":"209_CR18","doi-asserted-by":"crossref","unstructured":"Anastasiu, D.C., Karypis, G.: Fast parallel cosine k-nearest neighbor graph construction. In: Proceedings of the Sixth Workshop on Irregular Applications: Architectures and Algorithms, pp. 50\u201353. IEEE Press (2016)","DOI":"10.1109\/IA3.2016.013"},{"issue":"4","key":"209_CR19","doi-asserted-by":"publisher","first-page":"614","DOI":"10.1016\/S0022-0000(03)00026-6","volume":"66","author":"R Fagin","year":"2003","unstructured":"Fagin, R., Lotem, A., Naor, M.: Optimal aggregation algorithms for middleware. J. Comput. Syst. Sci. 66(4), 614\u2013656 (2003)","journal-title":"J. Comput. Syst. Sci."},{"key":"209_CR20","doi-asserted-by":"crossref","unstructured":"Ding, S., Suel, T.: Faster top-k document retrieval using block-max indexes. In: Proceedings of the 34th International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 993\u20131002. ACM (2011)","DOI":"10.1145\/2009916.2010048"},{"issue":"12","key":"209_CR21","doi-asserted-by":"publisher","first-page":"1213","DOI":"10.14778\/3402755.3402756","volume":"4","author":"M Fontoura","year":"2011","unstructured":"Fontoura, M., Josifovski, V., Liu, J., Venkatesan, S., Zhu, X., Zien, J.: Evaluation strategies for top-k queries over memory-resident inverted indexes. Proc. VLDB Endow. 4(12), 1213\u20131224 (2011)","journal-title":"Proc. VLDB Endow."},{"key":"209_CR22","doi-asserted-by":"crossref","unstructured":"Broder, A.Z., Carmel, D., Herscovici, M., Soffer, A., Zien, J.: Efficient query evaluation using a two-level retrieval process. In: Proceedings of the Twelfth International Conference on Information and Knowledge Management, pp. 426\u2013434. ACM (2003)","DOI":"10.1145\/956863.956944"},{"issue":"2\u20133","key":"209_CR23","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s10994-009-5127-5","volume":"76","author":"W Cheng","year":"2009","unstructured":"Cheng, W., H\u00fcllermeier, E.: Combining instance-based learning and logistic regression for multilabel classification. Mach. Learn. 76(2\u20133), 211\u2013225 (2009)","journal-title":"Mach. Learn."},{"key":"209_CR24","doi-asserted-by":"crossref","unstructured":"Wang, J., De\u00a0Vries, A.P., Reinders, M.J.: Unifying user-based and item-based collaborative filtering approaches by similarity fusion. In: Proceedings of the 29th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 501\u2013508. ACM (2006)","DOI":"10.1145\/1148170.1148257"},{"key":"209_CR25","unstructured":"Liu, Y.: Crafting concurrent data structures, Ph.D. dissertation, Lehigh University (2015)"},{"key":"209_CR26","doi-asserted-by":"crossref","unstructured":"Spyromitros, E., Tsoumakas, G., Vlahavas, I.: An empirical study of lazy multilabel classification algorithms. In: Hellenic Conference on Artificial Intelligence, pp. 401\u2013406. Springer (2008)","DOI":"10.1007\/978-3-540-87881-0_40"},{"key":"209_CR27","doi-asserted-by":"crossref","unstructured":"Verstrepen, K., Goethals, B.: Unifying nearest neighbors collaborative filtering. In: Proceedings of the 8th ACM Conference on Recommender Systems, pp. 177\u2013184. ACM (2014)","DOI":"10.1145\/2645710.2645731"},{"key":"209_CR28","doi-asserted-by":"publisher","first-page":"170","DOI":"10.1016\/j.patcog.2016.02.017","volume":"56","author":"I Triguero","year":"2016","unstructured":"Triguero, I., Vens, C.: Labelling strategies for hierarchical multi-label classification techniques. Pattern Recognit. 56, 170\u2013183 (2016)","journal-title":"Pattern Recognit."},{"key":"209_CR29","doi-asserted-by":"crossref","unstructured":"Yang, Y.: A study of thresholding strategies for text categorization. In: Proceedings of the 24th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 137\u2013145. ACM (2001)","DOI":"10.1145\/383952.383975"},{"key":"209_CR30","doi-asserted-by":"crossref","unstructured":"Draszawka, K., Szyma\u0144ski, J.: Thresholding strategies for large scale multi-label text classifier. In: 2013 6th International Conference on Human System Interactions (HSI), pp. 350\u2013355. IEEE (2013)","DOI":"10.1109\/HSI.2013.6577846"},{"issue":"Jul","key":"209_CR31","first-page":"2411","volume":"12","author":"G Tsoumakas","year":"2011","unstructured":"Tsoumakas, G., Spyromitros-Xioufis, E., Vilcek, J., Vlahavas, I.: Mulan: a java library for multi-label learning. J. Mach. Learn. Res. 12(Jul), 2411\u20132414 (2011)","journal-title":"J. Mach. Learn. Res."},{"issue":"1","key":"209_CR32","first-page":"667","volume":"17","author":"J Read","year":"2016","unstructured":"Read, J., Reutemann, P., Pfahringer, B., Holmes, G.: Meka: a multi-label\/multi-target extension to weka. J. Mach. Learn. Res. 17(1), 667\u2013671 (2016)","journal-title":"J. Mach. Learn. Res."},{"key":"209_CR33","unstructured":"Bhatia, K., Dahiya, K., Jain, H., Prabhu, Y., Varma, M.: The extreme classification repository: multi-label datasets & code (2016). http:\/\/manikvarma.org\/downloads\/XC\/XMLRepository.html. Accessed 13 Dec 2019"},{"key":"209_CR34","unstructured":"Partalas, I., Kosmopoulos, A., Baskiotis, N., Artieres, T., Paliouras, G., Gaussier, E., Androutsopoulos, I., Amini, M.-R., Galinari, P.: Lshtc: A benchmark for large-scale text classification (2015). arXiv:1503.08581"},{"key":"209_CR35","unstructured":"Zeng, Z.-Q., et al.: Fast training support vector machines using parallel sequential minimal optimization. In: 2008 3rd International Conference on Intelligent System and Knowledge Engineering, vol. 1. IEEE (2008)"},{"key":"209_CR36","unstructured":"Read, J., Pfahringer, B., Holmes, G.: Multi-label classification using ensembles of pruned sets. In: Eighth IEEE International Conference on Data Mining, 2008. ICDM\u201908, pp. 995\u20131000. IEEE (2008)"},{"key":"209_CR37","doi-asserted-by":"crossref","unstructured":"Jain, H., Prabhu, Y., Varma, M.: Extreme multi-label loss functions for recommendation, tagging, ranking & other missing label applications. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 935\u2013944. ACM (2016)","DOI":"10.1145\/2939672.2939756"},{"key":"209_CR38","unstructured":"Younes, Z., Abdallah, F., Den\u0153ux, T.: Multi-label classification algorithm derived from k-nearest neighbor rule with label dependencies. In: Signal Processing Conference, 2008 16th European, vol. 2008, pp. 1\u20135. IEEE (2008)"},{"key":"209_CR39","unstructured":"Wang, X.-l., Zhao, H., Lu, B.: Enhanced k-nearest neighbour algorithm for large-scale hierarchical multi-label classification. In: Proceedings of the Joint ECML\/PKDD PASCAL Workshop on Large-Scale Hierarchical Classification, Athens, Greece, vol.\u00a05 (2011)"},{"key":"209_CR40","doi-asserted-by":"crossref","unstructured":"Partalas, I., Kosmopoulos, A., Baskiotis, N., Arti\u00e8res, T., Paliouras, G., Gaussier, \u00c9., Androutsopoulos, I., Amini, M., Gallinari, P.: LSHTC: a benchmark for large-scale text classification. CoRR, vol. arXiv:1503.08581 (2015)","DOI":"10.1145\/2556195.2556208"},{"key":"209_CR41","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla, N.V., Bowyer, K.W., Hall, L.O., Kegelmeyer, W.P.: Smote: synthetic minority over-sampling technique. J. Artif. Intell. Res. 16, 321\u2013357 (2002)","journal-title":"J. Artif. Intell. Res."},{"issue":"4","key":"209_CR42","doi-asserted-by":"publisher","first-page":"667","DOI":"10.1016\/j.eswa.2004.12.023","volume":"28","author":"S Tan","year":"2005","unstructured":"Tan, S.: Neighbor-weighted k-nearest neighbor for unbalanced text corpus. Expert Syst. Appl. 28(4), 667\u2013671 (2005)","journal-title":"Expert Syst. Appl."},{"key":"209_CR43","doi-asserted-by":"crossref","unstructured":"Liu, C., Cao, L., Philip, S.Y.: A hybrid coupled k-nearest neighbor algorithm on imbalance data. In: 2014 International Joint Conference on Neural Networks (IJCNN), pp. 2011\u20132018. IEEE (2014)","DOI":"10.1109\/IJCNN.2014.6889798"},{"issue":"1","key":"209_CR44","first-page":"1605","volume":"14","author":"RB Zadeh","year":"2013","unstructured":"Zadeh, R.B., Goel, A.: Dimension independent similarity computation. J. Mach. Learn. Res. 14(1), 1605\u20131626 (2013)","journal-title":"J. Mach. Learn. Res."},{"key":"209_CR45","unstructured":"Mikolov, T., Chen, K., Corrado, G., Dean, J.: Efficient estimation of word representations in vector space (2013). arXiv:1301.3781"},{"key":"209_CR46","unstructured":"Devlin, J., Chang, M.-W., Lee, K., Toutanova, K.: Bert: pre-training of deep bidirectional transformers for language understanding (2018). arXiv:1810.04805"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-020-00209-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s41060-020-00209-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-020-00209-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,3]],"date-time":"2024-08-03T12:07:45Z","timestamp":1722686865000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s41060-020-00209-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,4,4]]},"references-count":46,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2020,9]]}},"alternative-id":["209"],"URL":"https:\/\/doi.org\/10.1007\/s41060-020-00209-1","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"type":"print","value":"2364-415X"},{"type":"electronic","value":"2364-4168"}],"subject":[],"published":{"date-parts":[[2020,4,4]]},"assertion":[{"value":"5 December 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 March 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 April 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}