{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,31]],"date-time":"2026-01-31T17:22:58Z","timestamp":1769880178312,"version":"3.49.0"},"reference-count":49,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2017,4,7]],"date-time":"2017-04-07T00:00:00Z","timestamp":1491523200000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2017,9]]},"DOI":"10.1007\/s10489-017-0911-6","type":"journal-article","created":{"date-parts":[[2017,4,7]],"date-time":"2017-04-07T00:11:01Z","timestamp":1491523861000},"page":"456-472","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Termset weighting by adapting term weighting schemes to utilize cardinality statistics for binary text categorization"],"prefix":"10.1007","volume":"47","author":[{"given":"Dima","family":"Badawi","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8434-6345","authenticated-orcid":false,"given":"Hakan","family":"Alt\u0131n\u00e7ay","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,4,7]]},"reference":[{"key":"911_CR1","doi-asserted-by":"crossref","first-page":"30","DOI":"10.1007\/s10489-015-0745-z","volume":"45","author":"HK Kim","year":"2016","unstructured":"Kim HK, Kim M (2016) Model-induced term-weighting schemes for text classification. Appl Intell 45:30\u201343","journal-title":"Appl Intell"},{"key":"911_CR2","doi-asserted-by":"crossref","first-page":"104","DOI":"10.1016\/j.knosys.2016.03.029","volume":"103","author":"B Al-Salemi","year":"2016","unstructured":"Al-Salemi B, Noah SAM, Aziz MJA (2016) Rfboost: an improved multi-label boosting algorithm and its application to text categorisation. Knowl Based Syst 103:104\u2013117","journal-title":"Knowl Based Syst"},{"issue":"4","key":"911_CR3","doi-asserted-by":"crossref","first-page":"1941","DOI":"10.1016\/j.eswa.2014.10.011","volume":"42","author":"RHW Pinheiro","year":"2015","unstructured":"Pinheiro RHW, Cavalcanti GDC, Ren TI (2015) Data-driven global-ranking local feature selection methods for text categorization. Expert Syst Appl 42(4):1941\u20131949","journal-title":"Expert Syst Appl"},{"key":"911_CR4","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/j.eswa.2016.03.041","volume":"57","author":"H Elghazel","year":"2016","unstructured":"Elghazel H, Aussem A, Gharroudi O, Saadaoui W (2016) Ensemble multi-label text categorization based on rotation forest and latent semantic indexing. Expert Syst Appl 57:1\u201311","journal-title":"Expert Syst Appl"},{"key":"911_CR5","doi-asserted-by":"crossref","first-page":"78","DOI":"10.1016\/j.procs.2013.09.083","volume":"22","author":"L Yang","year":"2013","unstructured":"Yang L, Li C, Ding Q, Li L (2013) Combining lexical and semantic features for short text classification. Procedia Comput Sci 22:78\u201386","journal-title":"Procedia Comput Sci"},{"issue":"1","key":"911_CR6","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F Sebastiani","year":"2002","unstructured":"Sebastiani F (2002) Machine learning in automated text categorization. ACM Comput Surv 34(1):1\u201347","journal-title":"ACM Comput Surv"},{"key":"911_CR7","doi-asserted-by":"crossref","first-page":"690","DOI":"10.1016\/j.eswa.2007.10.042","volume":"36","author":"Y Liu","year":"2009","unstructured":"Liu Y, Loh HT, Sun A (2009) Imbalanced text classification: a term weighting approach. Expert Syst Appl 36:690\u2013701","journal-title":"Expert Syst Appl"},{"key":"911_CR8","doi-asserted-by":"crossref","first-page":"5432","DOI":"10.1016\/j.eswa.2008.06.054","volume":"36","author":"J Chen","year":"2009","unstructured":"Chen J, Huang H, Tian S, Qu Y (2009) Feature selection for text classification with naive Bayes. Expert Syst Appl 36:5432\u20135435","journal-title":"Expert Syst Appl"},{"issue":"4","key":"911_CR9","doi-asserted-by":"crossref","first-page":"741","DOI":"10.1016\/j.ipm.2011.12.005","volume":"48","author":"J Yang","year":"2012","unstructured":"Yang J, Liu Y, Zhu X , Liu Z, Zhang X (2012) A new feature selection based on comprehensive measurement both in inter-category and intra-category for text categorization. Inf Process Manag 48(4):741\u2013754","journal-title":"Inf Process Manag"},{"key":"911_CR10","doi-asserted-by":"crossref","first-page":"784","DOI":"10.1145\/952532.952688","volume-title":"SAC\u201903: Proceedings of the 2003 ACM symposium on applied computing","author":"F Debole","year":"2003","unstructured":"Debole F, Sebastiani F (2003) Supervised term weighting for automated text categorization SAC\u201903: Proceedings of the 2003 ACM symposium on applied computing. ACM, New York, pp 784\u2013788"},{"issue":"4","key":"911_CR11","doi-asserted-by":"crossref","first-page":"137","DOI":"10.1016\/j.ipl.2012.11.005","volume":"113","author":"X Peng","year":"2013","unstructured":"Peng X, Yi Z, Wei XY, Peng DZ, Sang YS (2013) Free-gram phrase identification for modeling Chinese text. Inf Process Lett 113(4):137\u2013144","journal-title":"Inf Process Lett"},{"issue":"8","key":"911_CR12","doi-asserted-by":"crossref","first-page":"879","DOI":"10.1016\/j.knosys.2008.03.044","volume":"21","author":"W Zhang","year":"2008","unstructured":"Zhang W, Yoshida T, Tang X (2008) Text classification based on multi-word with support vector machine. Knowl-Based Syst 21(8):879\u2013886","journal-title":"Knowl-Based Syst"},{"issue":"3","key":"911_CR13","doi-asserted-by":"crossref","first-page":"2758","DOI":"10.1016\/j.eswa.2010.08.066","volume":"38","author":"W Zhang","year":"2011","unstructured":"Zhang W, Yoshida T, Tang X (2011) A comparative study of TF*IDF, LSI and multi-words for text classification. Expert Syst Appl 38(3):2758\u20132765","journal-title":"Expert Syst Appl"},{"key":"911_CR14","unstructured":"Bekkerman R, Allan J (2004) Using bigrams in text categorization. Technical Report IR-408. Center of Intelligent Information Retrieval, UMass Amherst"},{"issue":"5","key":"911_CR15","doi-asserted-by":"crossref","first-page":"843","DOI":"10.1016\/j.is.2011.02.002","volume":"36","author":"F Figueiredo","year":"2011","unstructured":"Figueiredo F, Rocha L, Couto T, Salles T, Gon\u00e7alves MA, Meira W (2011) Word co-occurrence features for text classification. Inf Syst 36(5):843\u2013858","journal-title":"Inf Syst"},{"key":"911_CR16","doi-asserted-by":"crossref","first-page":"138","DOI":"10.1145\/1166160.1166197","volume-title":"Proceedings of the 2006 ACM symposium on document engineering","author":"R Tesar","year":"2006","unstructured":"Tesar R, Strnad V, Jezek K, Poesio M (2006) Extending the single words-based document model: a comparison of bigrams and 2-itemsets Proceedings of the 2006 ACM symposium on document engineering. ACM, New York, pp 138\u2013146"},{"key":"911_CR17","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1145\/133160.133172","volume-title":"Proceedings of the 15th annual international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201992","author":"DD Lewis","year":"1992","unstructured":"Lewis DD (1992) An evaluation of phrasal and clustered representations on a text categorization task Proceedings of the 15th annual international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201992. ACM, New York, pp 37\u201350"},{"key":"911_CR18","unstructured":"Boulis C, Ostendorf M (2005) Text classification by augmenting the bag-of-words representation with redundancy compensated bigrams. In: Proceedings of the international workshop on feature selection in data mining, in conjunction with SIAM SDM-05, pp 9\u201316"},{"key":"911_CR19","unstructured":"Lewis DD (1992) Representation and learning in information retrieval. PhD thesis, Amherst, MA, USA. UMI Order No. GAX92-19460"},{"key":"911_CR20","unstructured":"F\u00fcrnkranz J (1998) A study using n-gram features for text categorization. Technical Report OEFAI-TR-98-30, Austrian Research Institute for Artificial Intelligence, Austria"},{"issue":"12","key":"911_CR21","doi-asserted-by":"crossref","first-page":"1598","DOI":"10.1016\/j.patrec.2010.05.005","volume":"31","author":"L \u00d6zg\u00fcr","year":"2010","unstructured":"\u00d6zg\u00fcr L, G\u00fcng\u00f6r T (2010) Text classification with the support of pruned dependency patterns. Pattern Recogn Lett 31(12):1598\u20131607","journal-title":"Pattern Recogn Lett"},{"key":"911_CR22","doi-asserted-by":"crossref","unstructured":"Tan CM, Wang YF, Lee CD (2002) The use of bigrams to enhance text categorization. In: Information processing management, vol 38, pp 529\u2013546","DOI":"10.1016\/S0306-4573(01)00045-0"},{"key":"911_CR23","doi-asserted-by":"crossref","first-page":"38","DOI":"10.1016\/j.engappai.2014.06.012","volume":"35","author":"D Badawi","year":"2014","unstructured":"Badawi D, Alt\u0131n\u00e7ay H (2014) A novel framework for termset selection and weighting in binary text classification. Eng Appl Artif Intell 35:38\u201353","journal-title":"Eng Appl Artif Intell"},{"key":"911_CR24","doi-asserted-by":"crossref","first-page":"215","DOI":"10.1016\/j.ijpe.2014.12.035","volume":"165","author":"W Zong","year":"2015","unstructured":"Zong W, Wu F, Chu LK, Sculli D (2015) A discriminative and semantic feature selection method for text categorization. Int J Prod Econom 165:215\u2013222","journal-title":"Int J Prod Econom"},{"issue":"4","key":"911_CR25","doi-asserted-by":"crossref","first-page":"721","DOI":"10.1109\/TPAMI.2008.110","volume":"31","author":"M Lan","year":"2009","unstructured":"Lan M, Tan CL, Su J, Lu Y (2009) Supervised and traditional term weighting methods for automatic text categorization. IEEE Trans Pattern Anal Mach Intell 31(4):721\u2013735","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"911_CR26","doi-asserted-by":"crossref","first-page":"176","DOI":"10.1016\/j.knosys.2015.03.025","volume":"83","author":"HJ Escalante","year":"2015","unstructured":"Escalante HJ, Garc\u00eda-Limo\u0307n MA, Morales-Reyes A, Graff M, Montes-y-Go\u0307mez M, Morales EF, Mart\u00ednez-Carranza J (2015) Term-weighting learning via genetic programming for text classification. Knowl-Based Syst 83:176\u2013189","journal-title":"Knowl-Based Syst"},{"key":"911_CR27","doi-asserted-by":"crossref","first-page":"434","DOI":"10.1016\/j.neucom.2015.04.051","volume":"167","author":"MA Fattah","year":"2015","unstructured":"Fattah MA (2015) New term weighting schemes with combination of multiple classifiers for sentiment analysis. Neurocomputing 167:434\u2013442","journal-title":"Neurocomputing"},{"issue":"3","key":"911_CR28","first-page":"202","volume":"10","author":"L Zhang","year":"2012","unstructured":"Zhang L, Hu X, Qin S (2012) Word combination kernel for text categorization. J Digit Inf Manag 10 (3):202\u2013211","journal-title":"J Digit Inf Manag"},{"key":"911_CR29","volume-title":"Classifying text documents by associating terms with text categories. In: Proceedings of the 13th Australasian database conference - vol 5, ADC 02, pp 215\u2013222","author":"OR Zaiane","year":"2002","unstructured":"Zaiane OR, Antonie ML (2002) Classifying text documents by associating terms with text categories. In: Proceedings of the 13th Australasian database conference - vol 5, ADC 02, pp 215\u2013222. Australian Computer Society, Inc, Darlinghurst"},{"issue":"1","key":"911_CR30","first-page":"99","volume":"29","author":"M Yuan","year":"2013","unstructured":"Yuan M, Ouyang Y, Xiong Z (2013) A text categorization method using extended vector space model by frequent term sets. J Inf Sci Eng 29(1):99\u2013114","journal-title":"J Inf Sci Eng"},{"key":"911_CR31","doi-asserted-by":"crossref","unstructured":"Meretakis D, W\u00fcthrich B (1999) Extending na\u00efve Bayes classifiers using long itemsets. In: Proceedings of the fifth ACM SIGKDD international conference on knowledge discovery and data mining, KDD \u201999, pp 165\u2013174","DOI":"10.1145\/312129.312222"},{"issue":"4","key":"911_CR32","doi-asserted-by":"crossref","first-page":"397","DOI":"10.1145\/1095872.1095874","volume":"23","author":"B P\u00f4ssas","year":"2005","unstructured":"P\u00f4ssas B, Ziviani N, Meira W, Neto BR (2005) Set-based vector model: an efficient approach for correlation-based ranking. ACM Trans Inf Syst 23(4):397\u2013429","journal-title":"ACM Trans Inf Syst"},{"issue":"2","key":"911_CR33","doi-asserted-by":"crossref","first-page":"193","DOI":"10.1016\/j.ipm.2009.09.009","volume":"46","author":"CL Chen","year":"2010","unstructured":"Chen CL, Tseng FSC, Frank SC, Liang T (2010) Mining fuzzy frequent itemsets for hierarchical document clustering. Inf Process Manag 46(2):193\u2013211","journal-title":"Inf Process Manag"},{"issue":"6","key":"911_CR34","doi-asserted-by":"crossref","first-page":"823","DOI":"10.1007\/s13042-013-0172-6","volume":"5","author":"MH Mohamed","year":"2014","unstructured":"Mohamed MH, Darwieesh Mm M (2014) Efficient mining frequent itemsets algorithms. Int J Mach Learn Cybern 5(6):823\u2013833","journal-title":"Int J Mach Learn Cybern"},{"issue":"6","key":"911_CR35","doi-asserted-by":"crossref","first-page":"437","DOI":"10.1002\/widm.1074","volume":"2","author":"C Borgelt","year":"2012","unstructured":"Borgelt C (2012) Frequent item set mining. Wiley Interdisc Rew Data Min Knowl Discov 2(6):437\u2013456","journal-title":"Wiley Interdisc Rew Data Min Knowl Discov"},{"key":"911_CR36","doi-asserted-by":"crossref","unstructured":"Khan MS, Muyeba M, Coenen F Fuzzy weighted association rule mining with weighted support and confidence framework. In: New frontiers in applied data mining: PAKDD 2008 international workshops. Osaka, pp 49\u201361","DOI":"10.1007\/978-3-642-00399-8_5"},{"issue":"4","key":"911_CR37","doi-asserted-by":"crossref","first-page":"1256","DOI":"10.1016\/j.eswa.2012.08.065","volume":"40","author":"B Vo","year":"2013","unstructured":"Vo B, Coenen F, Le B (2013) A new method for mining frequent weighted itemsets based on wit-trees. Expert Syst Appl 40(4):1256\u20131264","journal-title":"Expert Syst Appl"},{"key":"911_CR38","doi-asserted-by":"crossref","unstructured":"Bernecker T, Kriegel HP, Renz M, Verhein F, Zuefle A (2009) Probabilistic frequent itemset mining in uncertain databases. In: Proceedings of the 15th ACM SIGKDD international conference on knowledge discovery and data mining, KDD \u201909, pp 119\u2013128","DOI":"10.1145\/1557019.1557039"},{"key":"911_CR39","doi-asserted-by":"crossref","unstructured":"Antonie M L, Zaiane OR (2002) Text document categorization by term association. In: Proceedings of IEEE international conference on data mining (ICDM\u20192002), pp 19\u201326","DOI":"10.1109\/ICDM.2002.1183881"},{"key":"911_CR40","unstructured":"Haralambous Y, Lenca P (2014) Text classification using association rules, dependency pruning and hyperonymization. In: Proceedings of the 1st international workshop on interactions between data mining and natural language processing co-located with the European conference on machine learning and principles and practice of knowledge discovery in databases, DMNLP@PKDD\/ECML 2014. France, pp 65\u201380"},{"key":"911_CR41","unstructured":"Rossi RG, Rezende SO (2010) The use of frequent itemsets extracted from textual documents for the classification task. In: WTI 2010: International workshop on web and text intelligence located on international joint conference (SBIA, SBRN, JRI), pp 1\u201310"},{"key":"911_CR42","doi-asserted-by":"crossref","unstructured":"Tsai RT, Hung H, Dai H, Lin Y, Hsu W (2008) Exploiting likely-positive and unlabeled data to improve the identification of protein-protein interaction articles. BMC Bioinform 9(Suppl 1)","DOI":"10.1186\/1471-2105-9-S1-S3"},{"issue":"3","key":"911_CR43","first-page":"819","volume":"27","author":"Z Erenel","year":"2011","unstructured":"Erenel Z, Alt\u0131n\u00e7ay H, Varo\u011flu E (2011) Explicit use of term occurrence probabilities for term weighting in text categorization. J Inf Sci Eng 27(3):819\u2013834","journal-title":"J Inf Sci Eng"},{"key":"911_CR44","doi-asserted-by":"crossref","first-page":"1310","DOI":"10.1016\/j.patrec.2010.03.012","volume":"31","author":"H Alt\u0131n\u00e7ay","year":"2010","unstructured":"Alt\u0131n\u00e7ay H, Erenel Z (2010) Analytical evaluation of term weighting schemes for text categorization. Pattern Recogn Lett 31:1310\u20131323","journal-title":"Pattern Recogn Lett"},{"key":"911_CR45","doi-asserted-by":"crossref","first-page":"148","DOI":"10.1007\/s10489-010-0250-3","volume":"36","author":"H Alt\u0131n\u00e7ay","year":"2012","unstructured":"Alt\u0131n\u00e7ay H, Erenel Z (2012) Using the absolute difference of term occurrence probabilities in binary text categorization. Appl Intell 36:148\u2013160","journal-title":"Appl Intell"},{"key":"911_CR46","unstructured":"Buckley C (1985) Implementation of the smart information retrieval system. Technical report, Cornell University. Ithaca"},{"issue":"3","key":"911_CR47","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1108\/eb046814","volume":"14","author":"MF Porter","year":"1980","unstructured":"Porter MF (1980) An algorithm for suffix stripping. Program 14(3):130\u2013137","journal-title":"Program"},{"key":"911_CR48","doi-asserted-by":"crossref","first-page":"137","DOI":"10.1007\/BFb0026683","volume-title":"Proceedings of the 10th European conference on machine learning, ECML \u201998","author":"T Joachims","year":"1998","unstructured":"Joachims T (1998) Text categorization with suport vector machines: learning with many relevant features Proceedings of the 10th European conference on machine learning, ECML \u201998. Springer-Verlag, London, pp 137\u2013142"},{"key":"911_CR49","first-page":"169","volume-title":"Advances in kernel methods - support vector learning","author":"T Joachims","year":"1999","unstructured":"Joachims T (1999) Making large-scale SVM learning practical. In: Sch\u00f6lkoph B, Burges C J C, Smola A J (eds) Advances in kernel methods - support vector learning. MIT Press, Cambridge, pp 169\u2013184"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10489-017-0911-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-017-0911-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-017-0911-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,20]],"date-time":"2019-09-20T15:11:09Z","timestamp":1568992269000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10489-017-0911-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,4,7]]},"references-count":49,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2017,9]]}},"alternative-id":["911"],"URL":"https:\/\/doi.org\/10.1007\/s10489-017-0911-6","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,4,7]]}}}