{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,19]],"date-time":"2026-03-19T06:13:00Z","timestamp":1773900780624,"version":"3.50.1"},"reference-count":58,"publisher":"Springer Science and Business Media LLC","issue":"14","license":[{"start":{"date-parts":[[2021,3,10]],"date-time":"2021-03-10T00:00:00Z","timestamp":1615334400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,3,10]],"date-time":"2021-03-10T00:00:00Z","timestamp":1615334400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2021,6]]},"DOI":"10.1007\/s11042-021-10612-w","type":"journal-article","created":{"date-parts":[[2021,3,10]],"date-time":"2021-03-10T20:02:48Z","timestamp":1615406568000},"page":"20821-20847","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":18,"title":["Bag-of-Visual-Words codebook generation using deep features for effective classification of imbalanced multi-class image datasets"],"prefix":"10.1007","volume":"80","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4807-6787","authenticated-orcid":false,"given":"Manisha","family":"Saini","sequence":"first","affiliation":[]},{"given":"Seba","family":"Susan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,3,10]]},"reference":[{"key":"10612_CR1","unstructured":"Abadi M, Barham P, Chen J, Chen Z, Davis A, Dean J, ... & Kudlur M (2016). Tensorflow: A system for large-scale machine learning. In 12th {USENIX} symposium on operating systems design and implementation ({OSDI} 16) (pp. 265\u2013283)."},{"key":"10612_CR2","unstructured":"Bellet A, Habrard A, Sebban M (2013) A survey on metric learning for feature vectors and structured data. arXiv preprint arXiv:1306.6709"},{"issue":"1","key":"10612_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.2200\/S00626ED1V01Y201501AIM030","volume":"9","author":"A Bellet","year":"2015","unstructured":"Bellet A, Habrard A, Sebban M (2015) Metric learning. Synthesis Lectures on Artificial Intelligence and Machine Learning 9(1):1\u2013151","journal-title":"Synthesis Lectures on Artificial Intelligence and Machine Learning"},{"key":"10612_CR4","doi-asserted-by":"crossref","unstructured":"Bosch A, Zisserman A, Munoz X (2007, October) Image classification using random forests and ferns. In 2007 IEEE 11th international conference on computer vision (pp. 1-8). IEEE.","DOI":"10.1109\/ICCV.2007.4409066"},{"key":"10612_CR5","unstructured":"Brendel W, Bethge M (2019) Approximating cnns with bag-of-local-features models works surprisingly well on imagenet. arXiv preprint arXiv:1904.00760"},{"key":"10612_CR6","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1016\/j.neunet.2018.07.011","volume":"106","author":"M Buda","year":"2018","unstructured":"Buda M, Maki A, Mazurowski MA (2018) A systematic study of the class imbalance problem in convolutional neural networks. Neural Netw 106:249\u2013259","journal-title":"Neural Netw"},{"key":"10612_CR7","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) SMOTE: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357","journal-title":"J Artif Intell Res"},{"issue":"10","key":"10612_CR8","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1109\/LGRS.2017.2731997","volume":"14","author":"G Cheng","year":"2017","unstructured":"Cheng G, Li Z, Yao X, Guo L, Wei Z (2017) Remote sensing image scene classification using bag of convolutional features. IEEE Geosci Remote Sens Lett 14(10):1735\u20131739","journal-title":"IEEE Geosci Remote Sens Lett"},{"key":"10612_CR9","unstructured":"Convolutional Neural Networks (CNNs \/ ConvNets) (2019) The Stanford CS class notes, Spring 2019 Assignments, http:\/\/cs231n.github.io\/convolutional-networks\/, Accessed 28 August 2020."},{"issue":"3","key":"10612_CR10","first-page":"273","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes C, Vapnik V (1995) Support-vector networks. Mach Learn 20(3):273\u2013297","journal-title":"Mach Learn"},{"key":"10612_CR11","doi-asserted-by":"crossref","unstructured":"Deng J, Dong W, Socher R, Li LJ, Li K, Fei-Fei L (2009) Imagenet: a large-scale hierarchical image database. In 2009 IEEE conference on computer vision and pattern recognition (pp. 248-255). IEEE","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"10612_CR12","doi-asserted-by":"crossref","unstructured":"Deselaers, T., Pimenidis, L., & Ney, H. (2008, December). Bag-of-visual-words models for adult image classification and filtering. In 2008 19th International Conference on Pattern Recognition (pp. 1-4). IEEE.","DOI":"10.1109\/ICPR.2008.4761366"},{"key":"10612_CR13","unstructured":"Dittman DJ, Khoshgoftaar TM, Wald R, Napolitano A (2014, May). Comparison of data sampling approaches for imbalanced bioinformatics data. In The twenty-seventh international FLAIRS conference."},{"key":"10612_CR14","doi-asserted-by":"crossref","unstructured":"Eitrich T, Lang B (2006) Efficient optimization of support vector machine learning parameters for unbalanced datasets. J Comput Appl Math 196(2):425\u2013436","DOI":"10.1016\/j.cam.2005.09.009"},{"issue":"1","key":"10612_CR15","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1111\/j.0824-7935.2004.t01-1-00228.x","volume":"20","author":"A Estabrooks","year":"2004","unstructured":"Estabrooks A, Jo T, Japkowicz N (2004) A multiple resampling method for learning from imbalanced data sets. Comput Intell 20(1):18\u201336","journal-title":"Comput Intell"},{"key":"10612_CR16","first-page":"1","volume":"2017","author":"J Feng","year":"2017","unstructured":"Feng J, Liu Y, Wu L (2017) Bag of visual words model with deep spatial features for geographical scene classification. Computational intelligence and neuroscience 2017:1\u201314","journal-title":"Computational intelligence and neuroscience"},{"key":"10612_CR17","doi-asserted-by":"publisher","first-page":"64827","DOI":"10.1109\/ACCESS.2019.2917266","volume":"7","author":"MI Georgescu","year":"2019","unstructured":"Georgescu MI, Ionescu RT, Popescu M (2019) Local learning with deep and handcrafted features for facial expression recognition. IEEE Access 7:64827\u201364836","journal-title":"IEEE Access"},{"key":"10612_CR18","volume-title":"Hands-on machine learning with Scikit-learn, Keras, and TensorFlow: concepts, tools, and techniques to build intelligent systems","author":"A G\u00e9ron","year":"2019","unstructured":"G\u00e9ron A (2019) Hands-on machine learning with Scikit-learn, Keras, and TensorFlow: concepts, tools, and techniques to build intelligent systems. O'Reilly Media"},{"issue":"1","key":"10612_CR19","doi-asserted-by":"publisher","first-page":"100","DOI":"10.1016\/S0734-189X(85)90153-7","volume":"29","author":"RM Haralick","year":"1985","unstructured":"Haralick RM, Shapiro LG (1985) Image segmentation techniques. Computer vision, graphics, and image processing 29(1):100\u2013132","journal-title":"Computer vision, graphics, and image processing"},{"key":"10612_CR20","unstructured":"He H, Bai Y, Garcia EA Li S (2008) ADASYN: adaptive synthetic sampling approach for imbalanced learning. In 2008 IEEE international joint conference on neural networks (IEEE world congress on computational intelligence) pp 1322\u20131328 IEEE"},{"key":"10612_CR21","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016). Deep residual learning for image recognition. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 770-778).","DOI":"10.1109\/CVPR.2016.90"},{"key":"10612_CR22","doi-asserted-by":"crossref","unstructured":"Hou Q, Cheng MM, Hu X, Borji A, Tu Z, Torr PH (2017) Deeply supervised salient object detection with short connections. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition pp 3203\u20133212","DOI":"10.1109\/CVPR.2017.563"},{"issue":"1","key":"10612_CR23","first-page":"46","volume":"1","author":"SB Kotsiantis","year":"2003","unstructured":"Kotsiantis SB, Pintelas PE (2003) Mixture of expert agents for handling imbalanced data sets. Annals of Mathematics, Computing & Teleinformatics 1(1):46\u201355","journal-title":"Annals of Mathematics, Computing & Teleinformatics"},{"key":"10612_CR24","unstructured":"Kumar MD, Babaie M, Zhu S, Kalra S, Tizhoosh HR (2017) A comparative study of CNN, BoVW and LBP for classification of histopathological images. In 2017 IEEE Symposium Series on Computational Intelligence (SSCI) pp 1\u20137. IEEE"},{"key":"10612_CR25","unstructured":"Lessmann S (2004) Solving imbalanced classification problems with support vector machines. In IC-AI 4:214\u2013220"},{"key":"10612_CR26","unstructured":"Li P, Samorodnitsk G, Hopcroft J (2013) Sign cauchy projections and chi-square kernel. In Advances in Neural Information Processing Systems pp 2571\u20132579"},{"key":"10612_CR27","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1016\/j.ins.2013.07.007","volume":"250","author":"V L\u00f3pez","year":"2013","unstructured":"L\u00f3pez V, Fern\u00e1ndez A, Garc\u00eda S, Palade V, Herrera F (2013) An insight into classification with imbalanced data: empirical results and current trends on using data intrinsic characteristics. Inf Sci 250:113\u2013141","journal-title":"Inf Sci"},{"key":"10612_CR28","doi-asserted-by":"crossref","unstructured":"Mahmood A, Bennamoun M, An S, Sohel F (2017) Resfeats: residual network based features for image classification. In 2017 IEEE international conference on image processing (ICIP) pp 1597\u20131601 IEEE","DOI":"10.1109\/ICIP.2017.8296551"},{"key":"10612_CR29","doi-asserted-by":"crossref","unstructured":"Okafor E, Pawara P, Karaaba F, Surinta O, Codreanu V, Schomaker L, Wiering M (2016, December). Comparative study between deep learning and bag of visual words for wild-animal recognition. In 2016 IEEE Symposium Series on Computational Intelligence (SSCI) (pp. 1-8). IEEE.","DOI":"10.1109\/SSCI.2016.7850111"},{"key":"10612_CR30","doi-asserted-by":"crossref","unstructured":"Opelt A, Fussenegger M, Pinz A, Auer P (2004) Weak hypotheses and boosting for generic object detection and recognition. In European conference on computer vision Springer, Berlin, Heidelberg pp. 71\u201384","DOI":"10.1007\/978-3-540-24671-8_6"},{"issue":"1","key":"10612_CR31","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1504\/IJAIP.2017.081179","volume":"9","author":"RJ Oskouei","year":"2017","unstructured":"Oskouei RJ, Bigham BS (2017) Over-sampling via under-sampling in strongly imbalanced data. International Journal of Advanced Intelligence Paradigms 9(1):58\u201366","journal-title":"International Journal of Advanced Intelligence Paradigms"},{"key":"10612_CR32","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Vanderplas J (2011) Scikit-learn: Machine learning in Python. the Journal of machine Learning research, 12:2825\u20132830"},{"key":"10612_CR33","volume-title":"Evaluation: from precision, recall and F-measure to ROC, informedness, markedness and correlation","author":"DM Powers","year":"2011","unstructured":"Powers DM (2011) Evaluation: from precision, recall and F-measure to ROC, informedness, markedness and correlation"},{"key":"10612_CR34","unstructured":"Provost F (2000) Machine learning from imbalanced data sets 101. In Proceedings of the AAAI\u20192000 workshop on imbalanced data sets 68(2000):1\u20133 AAAI press"},{"key":"10612_CR35","unstructured":"Rahimi A, Recht B (2008) Random features for large-scale kernel machines. In Advances in neural information processing systems pp. 1177\u20131184"},{"key":"10612_CR36","doi-asserted-by":"publisher","first-page":"164","DOI":"10.1016\/j.patcog.2016.03.012","volume":"57","author":"JA S\u00e1ez","year":"2016","unstructured":"S\u00e1ez JA, Krawczyk B, Wo\u017aniak M (2016) Analyzing the over-sampling of different classes and types of examples in multi-class imbalanced datasets. Pattern Recogn 57:164\u2013178","journal-title":"Pattern Recogn"},{"key":"10612_CR37","doi-asserted-by":"crossref","unstructured":"Saini M, Susan S (2018) Comparison of deep learning, data augmentation and bag of-visual-words for classification of imbalanced image datasets. In International Conference on Recent Trends in Image Processing and Pattern Recognition Springer, Singapore pp. 561\u2013571","DOI":"10.1007\/978-981-13-9181-1_49"},{"key":"10612_CR38","doi-asserted-by":"crossref","unstructured":"Saini M, Susan S (2019) Data augmentation of minority class with transfer learning for classification of imbalanced breast Cancer dataset using inception-V3. In Iberian Conference on Pattern Recognition and Image Analysis Springer, Cham pp. 409\u2013420","DOI":"10.1007\/978-3-030-31332-6_36"},{"key":"10612_CR39","doi-asserted-by":"publisher","first-page":"106759","DOI":"10.1016\/j.asoc.2020.106759","volume":"97","author":"M Saini","year":"2020","unstructured":"Saini M, Susan S (2020) Deep transfer with minority data augmentation for imbalanced breast cancer dataset. Appl Soft Comput 97:106759","journal-title":"Appl Soft Comput"},{"key":"10612_CR40","doi-asserted-by":"crossref","unstructured":"Sculley D (2010) Web-scale k-means clustering. In Proceedings of the 19th international conference on World wide web pp. 1177\u20131178","DOI":"10.1145\/1772690.1772862"},{"issue":"5","key":"10612_CR41","doi-asserted-by":"publisher","first-page":"1285","DOI":"10.1109\/TMI.2016.2528162","volume":"35","author":"HC Shin","year":"2016","unstructured":"Shin HC, Roth HR, Gao M, Lu L, Xu Z, Nogues I, Yao J, Mollura D, Summers RM (2016) Deep convolutional neural networks for computer-aided detection: CNN architectures, dataset characteristics and transfer learning. IEEE Trans Med Imaging 35(5):1285\u20131298","journal-title":"IEEE Trans Med Imaging"},{"key":"10612_CR42","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556"},{"key":"10612_CR43","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1016\/j.biosystemseng.2017.11.015","volume":"166","author":"HK Suh","year":"2018","unstructured":"Suh HK, Hofstee JW, IJsselmuiden J, van Henten EJ (2018) Sugar beet and volunteer potato classification using Bag-of-Visual-Words model, scale-invariant feature transform, or speeded up robust feature descriptors and crop row information. Biosyst Eng 166:210\u2013226","journal-title":"Biosyst Eng"},{"key":"10612_CR44","doi-asserted-by":"crossref","unstructured":"Susan S, Kumar A (2018, December). Hybrid of intelligent minority over-sampling and PSO-based intelligent majority under-sampling for learning from imbalanced datasets. In International Conference on Intelligent Systems Design and Applications (pp. 760-769). Springer, Cham.","DOI":"10.1007\/978-3-030-16660-1_74"},{"key":"10612_CR45","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1016\/j.asoc.2019.02.028","volume":"78","author":"S Susan","year":"2019","unstructured":"Susan S, Kumar A (2019) SSOMaj-SMOTE-SSOMin: three-step intelligent pruning of majority and minority samples for learning from imbalanced datasets. Appl Soft Comput 78:141\u2013149","journal-title":"Appl Soft Comput"},{"issue":"11","key":"10612_CR46","doi-asserted-by":"publisher","first-page":"951","DOI":"10.1049\/iet-ipr.2014.0670","volume":"9","author":"S Susan","year":"2015","unstructured":"Susan S, Jain A, Sharma A, Verma S, Jain S (2015) Fuzzy match index for scale-invariant feature transform (SIFT) features with application to face recognition with weak supervision. IET Image Process 9(11):951\u2013958","journal-title":"IET Image Process"},{"key":"10612_CR47","doi-asserted-by":"crossref","unstructured":"Susan S, Sethi D, Arora K CW-CAE: pulmonary nodule detection from imbalanced dataset using class-weighted convolutional autoencoder. In International Conference on Innovative Computing and Communications (pp. 825-833). Springer. Singapore.","DOI":"10.1007\/978-981-15-5148-2_71"},{"key":"10612_CR48","doi-asserted-by":"crossref","unstructured":"Syarif, I., Prugel-Bennett, A., & Wills, G. (2012, April). Unsupervised clustering approach for network anomaly detection. In International conference on networked digital technologies (pp. 135-145). Springer, Berlin, Heidelberg.","DOI":"10.1007\/978-3-642-30507-8_13"},{"issue":"10","key":"10612_CR49","doi-asserted-by":"publisher","first-page":"3738","DOI":"10.1016\/j.patcog.2012.03.014","volume":"45","author":"MA Tahir","year":"2012","unstructured":"Tahir MA, Kittler J, Yan F (2012) Inverse random under sampling for class imbalance problem and its application to multi-label classification. Pattern Recogn 45(10):3738\u20133750","journal-title":"Pattern Recogn"},{"issue":"5","key":"10612_CR50","doi-asserted-by":"publisher","first-page":"1299","DOI":"10.1109\/TMI.2016.2535302","volume":"35","author":"N Tajbakhsh","year":"2016","unstructured":"Tajbakhsh N, Shin JY, Gurudu SR, Hurst RT, Kendall CB, Gotway MB, Liang J (2016) Convolutional neural networks for medical image analysis: full training or fine tuning? IEEE Trans Med Imaging 35(5):1299\u20131312","journal-title":"IEEE Trans Med Imaging"},{"key":"10612_CR51","unstructured":"Tang Y (2013) Deep learning using linear support vector machines. arXiv preprint arXiv:1306.0239"},{"key":"10612_CR52","unstructured":"Tax DM, Duin RP (2000) Feature scaling in support vector data descriptions. Learning from Imbalanced Datasets, 25\u201330"},{"key":"10612_CR53","volume-title":"January","author":"The TensorFlow Team","year":"2019","unstructured":"The TensorFlow Team (2019) January. Flowers, TensorFlow Datasets http:\/\/download.tensorflow.org\/example_images\/flower_photos.tgz"},{"key":"10612_CR54","first-page":"1","volume":"2018","author":"A Voulodimos","year":"2018","unstructured":"Voulodimos A, Doulamis N, Doulamis A, Protopapadakis E (2018) Deep learning for computer vision: a brief review. Computational intelligence and neuroscience 2018:1\u201313","journal-title":"Computational intelligence and neuroscience"},{"key":"10612_CR55","doi-asserted-by":"publisher","first-page":"42639","DOI":"10.1109\/ACCESS.2019.2907043","volume":"7","author":"XD Wang","year":"2019","unstructured":"Wang XD, Chen RC, Yan F, Zeng ZQ, Hong CQ (2019) Fast adaptive K-means subspace clustering for high-dimensional data. IEEE Access 7:42639\u201342651","journal-title":"IEEE Access"},{"key":"10612_CR56","unstructured":"Wang X, Zheng Z, He Y, Yan F, Zeng Z, Yang Y (2020) Progressive local filter pruning for image retrieval acceleration. arXiv preprint arXiv:2001.08878"},{"key":"10612_CR57","unstructured":"Xia X, Xu C, Nan B (2017) Inception-v3 for flower classification. In 2017 2nd International Conference on Image, Vision and Computing (ICIVC) pp. 783\u2013787 IEEE"},{"issue":"18","key":"10612_CR58","doi-asserted-by":"publisher","first-page":"3823","DOI":"10.1016\/j.neucom.2011.07.024","volume":"74","author":"H Yang","year":"2011","unstructured":"Yang H, Shao L, Zheng F, Wang L, Song Z (2011) Recent advances and trends in visual tracking: a review. Neurocomputing 74(18):3823\u20133831","journal-title":"Neurocomputing"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-10612-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-021-10612-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-10612-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,25]],"date-time":"2021-05-25T05:09:19Z","timestamp":1621919359000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-021-10612-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3,10]]},"references-count":58,"journal-issue":{"issue":"14","published-print":{"date-parts":[[2021,6]]}},"alternative-id":["10612"],"URL":"https:\/\/doi.org\/10.1007\/s11042-021-10612-w","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,3,10]]},"assertion":[{"value":"20 May 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 November 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 January 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 March 2021","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}