{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:09:54Z","timestamp":1750219794173,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":24,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,11,7]],"date-time":"2022-11-07T00:00:00Z","timestamp":1667779200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100004901","name":"Funda\u00e7\u00e3o de Amparo \u00e0 Pesquisa do Estado de Minas Gerais","doi-asserted-by":"publisher","award":["APQ-02176-21"],"award-info":[{"award-number":["APQ-02176-21"]}],"id":[{"id":"10.13039\/501100004901","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003593","name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","doi-asserted-by":"publisher","award":["406411\/2021-2"],"award-info":[{"award-number":["406411\/2021-2"]}],"id":[{"id":"10.13039\/501100003593","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,11,7]]},"DOI":"10.1145\/3539637.3557057","type":"proceedings-article","created":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T22:14:00Z","timestamp":1664230440000},"page":"142-149","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["A Cascade Approach for Gender Prediction from Texts in Portuguese Language"],"prefix":"10.1145","author":[{"given":"Jo\u00e3o Pedro Moreira","family":"de Morais","sequence":"first","affiliation":[{"name":"Department of Computer Science, Federal University of Lavras, Brazil"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luiz Henrique de Campos","family":"Merschmann","sequence":"additional","affiliation":[{"name":"Department of Applied Computing, Federal University of Lavras, Brazil"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2022,11,7]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866)","author":"Arcia Yaritza\u00a0Adame","year":"2017","unstructured":"Yaritza\u00a0Adame Arcia , Daniel Castro-Castro , Reynier\u00a0Ortega Bueno , and Rafael Mu\u00f1oz . 2017 . Author Profiling, instance-based Similarity Classification . In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866) . CEUR-WS.org. Yaritza\u00a0Adame Arcia, Daniel Castro-Castro, Reynier\u00a0Ortega Bueno, and Rafael Mu\u00f1oz. 2017. Author Profiling, instance-based Similarity Classification. In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866). CEUR-WS.org."},{"key":"e_1_3_2_1_2_1","volume-title":"N-gram: New groningen author-profiling model. https:\/\/doi.org\/10.48550\/ARXIV.1707.03764","author":"Basile Angelo","year":"2017","unstructured":"Angelo Basile , Gareth Dwyer , Maria Medvedeva , Josine Rawee , Hessel Haagsma , and Malvina Nissim . 2017 . N-gram: New groningen author-profiling model. https:\/\/doi.org\/10.48550\/ARXIV.1707.03764 10.48550\/ARXIV.1707.03764 Angelo Basile, Gareth Dwyer, Maria Medvedeva, Josine Rawee, Hessel Haagsma, and Malvina Nissim. 2017. N-gram: New groningen author-profiling model. https:\/\/doi.org\/10.48550\/ARXIV.1707.03764"},{"volume-title":"Natural language processing with Python: analyzing text with the natural language toolkit. O\u2019Reilly Media","author":"Bird Steven","key":"e_1_3_2_1_3_1","unstructured":"Steven Bird , Ewan Klein , and Edward Loper . 2009. Natural language processing with Python: analyzing text with the natural language toolkit. O\u2019Reilly Media , Inc . Steven Bird, Ewan Klein, and Edward Loper. 2009. Natural language processing with Python: analyzing text with the natural language toolkit. O\u2019Reilly Media, Inc."},{"key":"#cr-split#-e_1_3_2_1_4_1.1","unstructured":"Alina\u00a0Maria Ciobanu Marcos Zampieri Shervin Malmasi and Liviu\u00a0P. Dinu. 2017. Including dialects and language varieties in author profiling. https:\/\/doi.org\/10.48550\/ARXIV.1707.00621 10.48550\/ARXIV.1707.00621"},{"key":"#cr-split#-e_1_3_2_1_4_1.2","unstructured":"Alina\u00a0Maria Ciobanu Marcos Zampieri Shervin Malmasi and Liviu\u00a0P. Dinu. 2017. Including dialects and language varieties in author profiling. https:\/\/doi.org\/10.48550\/ARXIV.1707.00621"},{"key":"#cr-split#-e_1_3_2_1_5_1.1","doi-asserted-by":"crossref","unstructured":"Jo\u00e3o\u00a0Pedro de Morais and Luiz\u00a0Henrique Merschmann. 2021. Uma Abordagem H\u00edbrida para Predi\u00e7\u00e3o de G\u00eanero a partir de Textos em Portugu\u00eas. In Anais do XXXVI Simp\u00f3sio Brasileiro de Bancos de Dados (Rio de Janeiro). SBC Porto Alegre RS Brasil 49-60. https:\/\/doi.org\/10.5753\/sbbd.2021.17865 10.5753\/sbbd.2021.17865","DOI":"10.5753\/sbbd.2021.17865"},{"key":"#cr-split#-e_1_3_2_1_5_1.2","doi-asserted-by":"crossref","unstructured":"Jo\u00e3o\u00a0Pedro de Morais and Luiz\u00a0Henrique Merschmann. 2021. Uma Abordagem H\u00edbrida para Predi\u00e7\u00e3o de G\u00eanero a partir de Textos em Portugu\u00eas. In Anais do XXXVI Simp\u00f3sio Brasileiro de Bancos de Dados (Rio de Janeiro). SBC Porto Alegre RS Brasil 49-60. https:\/\/doi.org\/10.5753\/sbbd.2021.17865","DOI":"10.5753\/sbbd.2021.17865"},{"key":"e_1_3_2_1_6_1","volume-title":"Proceedings of The 12th Language Resources and Evaluation Conference. European Language Resources Association","author":"Dias Rafael","year":"2020","unstructured":"Rafael Dias and Ivandr\u00e9 Paraboni . 2020 . Cross-domain Author Gender Classification in Brazilian Portuguese . In Proceedings of The 12th Language Resources and Evaluation Conference. European Language Resources Association , Marseille, France, 1227\u20131234. Rafael Dias and Ivandr\u00e9 Paraboni. 2020. Cross-domain Author Gender Classification in Brazilian Portuguese. In Proceedings of The 12th Language Resources and Evaluation Conference. European Language Resources Association, Marseille, France, 1227\u20131234."},{"key":"e_1_3_2_1_7_1","volume-title":"BlogSet-BR: A Brazilian Portuguese Blog Corpus. In 11th International Conference on Language Resources and Evaluation. ELRA","author":"dos Santos Henrique","year":"2018","unstructured":"Henrique D.\u00a0P. dos Santos , Vinicius Woloszyn , and Renata Vieira . 2018 . BlogSet-BR: A Brazilian Portuguese Blog Corpus. In 11th International Conference on Language Resources and Evaluation. ELRA , Miyazaki, Japan, 1110\u20131123. Henrique D.\u00a0P. dos Santos, Vinicius Woloszyn, and Renata Vieira. 2018. BlogSet-BR: A Brazilian Portuguese Blog Corpus. In 11th International Conference on Language Resources and Evaluation. ELRA, Miyazaki, Japan, 1110\u20131123."},{"key":"e_1_3_2_1_8_1","volume-title":"Exsense: Extract sensitive information from unstructured data. Computers & Security(2021). https:\/\/doi.org\/10.1016\/j.cose.2020.102156","author":"Guo Yongyan","year":"2021","unstructured":"Yongyan Guo , Jiayong Liu , Wenwu Tang , and Cheng Huang . 2021 . Exsense: Extract sensitive information from unstructured data. Computers & Security(2021). https:\/\/doi.org\/10.1016\/j.cose.2020.102156 10.1016\/j.cose.2020.102156 Yongyan Guo, Jiayong Liu, Wenwu Tang, and Cheng Huang. 2021. Exsense: Extract sensitive information from unstructured data. Computers & Security(2021). https:\/\/doi.org\/10.1016\/j.cose.2020.102156"},{"key":"e_1_3_2_1_9_1","volume-title":"Proceedings of the Eleventh International Conference on Language Resources and Evaluation. European Language Resources Association","author":"Hsieh Fernando","year":"2018","unstructured":"Fernando Hsieh , Rafael Dias , and Ivandr\u00e9 Paraboni . 2018 . Author Profiling from Facebook Corpora . In Proceedings of the Eleventh International Conference on Language Resources and Evaluation. European Language Resources Association , Miyazaki, Japan, 1210\u2013132. Fernando Hsieh, Rafael Dias, and Ivandr\u00e9 Paraboni. 2018. Author Profiling from Facebook Corpora. In Proceedings of the Eleventh International Conference on Language Resources and Evaluation. European Language Resources Association, Miyazaki, Japan, 1210\u2013132."},{"key":"e_1_3_2_1_10_1","volume-title":"Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland","author":"Markov Ilia","year":"2017","unstructured":"Ilia Markov , Helena G\u00f3mez-Adorno , and Grigori Sidorov . 2017. Language-and Subtask-Dependent Feature Selection and Classifier Parameter Tuning for Author Profiling . In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland , September 11-14, 2017 (CEUR Workshop Proceedings, Vol .\u00a01866). CEUR-WS. org. Ilia Markov, Helena G\u00f3mez-Adorno, and Grigori Sidorov. 2017. Language-and Subtask-Dependent Feature Selection and Classifier Parameter Tuning for Author Profiling. In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866). CEUR-WS.org."},{"key":"e_1_3_2_1_11_1","volume-title":"Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland","author":"Martinc Matej","year":"2017","unstructured":"Matej Martinc , Iza Skrjanec , Katja Zupan , and Senja Pollak . 2017. PAN 2017: Author Profiling-Gender and Language Variety Prediction . In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland , September 11-14, 2017 (CEUR Workshop Proceedings, Vol .\u00a01866). CEUR-WS. org. Matej Martinc, Iza Skrjanec, Katja Zupan, and Senja Pollak. 2017. PAN 2017: Author Profiling-Gender and Language Variety Prediction. In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866). CEUR-WS.org."},{"key":"e_1_3_2_1_12_1","volume-title":"Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866)","author":"Miura Yasuhide","year":"2017","unstructured":"Yasuhide Miura , Tomoki Taniguchi , Motoki Taniguchi , and Tomoko Ohkuma . 2017 . Author Profiling with Word+Character Neural Attention Network . In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866) . CEUR-WS.org. Yasuhide Miura, Tomoki Taniguchi, Motoki Taniguchi, and Tomoko Ohkuma. 2017. Author Profiling with Word+Character Neural Attention Network. In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866). CEUR-WS.org."},{"key":"e_1_3_2_1_13_1","volume-title":"Study of Language and Age in Twitter. In Seventh International AAAI Conference on Weblogs and Social Media. International Conference on Weblogs and Social Media, Massachusetts USA.","author":"Nguyen Dong","year":"2013","unstructured":"Dong Nguyen , Rilana Gravel , Dolf Trieschnigg , and Theo Meder . 2013 . \u201d How Old Do You Think I Am?\u201d A Study of Language and Age in Twitter. In Seventh International AAAI Conference on Weblogs and Social Media. International Conference on Weblogs and Social Media, Massachusetts USA. Dong Nguyen, Rilana Gravel, Dolf Trieschnigg, and Theo Meder. 2013. \u201dHow Old Do You Think I Am?\u201d A Study of Language and Age in Twitter. In Seventh International AAAI Conference on Weblogs and Social Media. International Conference on Weblogs and Social Media, Massachusetts USA."},{"key":"e_1_3_2_1_14_1","volume-title":"Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866)","author":"Manuel\u00a0Rangel Pardo Francisco","year":"2017","unstructured":"Francisco Manuel\u00a0Rangel Pardo , Paolo Rosso , Martin Potthast , and Benno Stein . 2017 . Overview of the 5th Author Profiling Task at PAN 2017: Gender and Language Variety Identification in Twitter . In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866) , Linda Cappellato, Nicola Ferro, Lorraine Goeuriot, and Thomas Mandl (Eds.). CEUR-WS.org. Francisco Manuel\u00a0Rangel Pardo, Paolo Rosso, Martin Potthast, and Benno Stein. 2017. Overview of the 5th Author Profiling Task at PAN 2017: Gender and Language Variety Identification in Twitter. In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866), Linda Cappellato, Nicola Ferro, Lorraine Goeuriot, and Thomas Mandl (Eds.). CEUR-WS.org."},{"key":"e_1_3_2_1_15_1","unstructured":"Fabian Pedregosa Ga\u00ebl Varoquaux Alexandre Gramfort Vincent Michel Bertrand Thirion Olivier Grisel Mathieu Blondel Peter Prettenhofer Ron Weiss Vincent Dubourg Jake Vanderplas Alexandre Passos David Cournapeau Matthieu Brucher Matthieu Perrot and \u00c9douard Duchesnay. 2011. Scikit-Learn: Machine Learning in Python. Journal of Machine Learning Research(2011) 2825\u20132830.  Fabian Pedregosa Ga\u00ebl Varoquaux Alexandre Gramfort Vincent Michel Bertrand Thirion Olivier Grisel Mathieu Blondel Peter Prettenhofer Ron Weiss Vincent Dubourg Jake Vanderplas Alexandre Passos David Cournapeau Matthieu Brucher Matthieu Perrot and \u00c9douard Duchesnay. 2011. Scikit-Learn: Machine Learning in Python. Journal of Machine Learning Research(2011) 2825\u20132830."},{"key":"e_1_3_2_1_16_1","volume-title":"Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866)","author":"Poulston Adam","year":"2017","unstructured":"Adam Poulston , Zeerak Waseem , and Mark Stevenson . 2017 . Using TF-IDF n-gram and Word Embedding Cluster Ensembles for Author Profiling . In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866) . CEUR-WS.org. Adam Poulston, Zeerak Waseem, and Mark Stevenson. 2017. Using TF-IDF n-gram and Word Embedding Cluster Ensembles for Author Profiling. In Working Notes of CLEF 2017 - Conference and Labs of the Evaluation Forum, Dublin, Ireland, September 11-14, 2017(CEUR Workshop Proceedings, Vol.\u00a01866). CEUR-WS.org."},{"key":"e_1_3_2_1_17_1","volume-title":"Proceedings of the Eleventh International Conference on Language Resources and Evaluation. European Language Resources Association","author":"Ramos Ricelli","year":"2018","unstructured":"Ricelli Ramos , Georges Neto , Barbara Silva , Danielle Monteiro , Ivandr\u00e9 Paraboni , and Rafael Dias . 2018 . Building a corpus for personality-dependent natural language understanding and generation . In Proceedings of the Eleventh International Conference on Language Resources and Evaluation. European Language Resources Association , Miyazaki, Japan, 1138\u20131145. Ricelli Ramos, Georges Neto, Barbara Silva, Danielle Monteiro, Ivandr\u00e9 Paraboni, and Rafael Dias. 2018. Building a corpus for personality-dependent natural language understanding and generation. In Proceedings of the Eleventh International Conference on Language Resources and Evaluation. European Language Resources Association, Miyazaki, Japan, 1138\u20131145."},{"key":"e_1_3_2_1_18_1","volume-title":"CLEF 2015 Evaluation Labs and Workshop Working Notes Papers. 1\u20138.","author":"Rangel\u00a0Pardo Francisco\u00a0Manuel","year":"2015","unstructured":"Francisco\u00a0Manuel Rangel\u00a0Pardo , Fabio Celli , Paolo Rosso , Martin Potthast , Benno Stein , and Walter Daelemans . 2015 . Overview of the 3rd Author Profiling Task at PAN 2015 . In CLEF 2015 Evaluation Labs and Workshop Working Notes Papers. 1\u20138. Francisco\u00a0Manuel Rangel\u00a0Pardo, Fabio Celli, Paolo Rosso, Martin Potthast, Benno Stein, and Walter Daelemans. 2015. Overview of the 3rd Author Profiling Task at PAN 2015. In CLEF 2015 Evaluation Labs and Workshop Working Notes Papers. 1\u20138."},{"key":"e_1_3_2_1_19_1","volume-title":"XII Symposium in Information and Human Language Technology and Collocates Events. STIL, Salvador, BA, 200\u2013208","author":"Real Livy","year":"2019","unstructured":"Livy Real , Marcio Oshiro , and Alexandre Mafra . 2019 . B2W-Reviews01 An open product reviews corpus . In XII Symposium in Information and Human Language Technology and Collocates Events. STIL, Salvador, BA, 200\u2013208 . Livy Real, Marcio Oshiro, and Alexandre Mafra. 2019. B2W-Reviews01 An open product reviews corpus. In XII Symposium in Information and Human Language Technology and Collocates Events. STIL, Salvador, BA, 200\u2013208."},{"key":"e_1_3_2_1_20_1","volume-title":"Proceedings of the International Conference on Recent Advances in Natural Language Processing. INCOMA Ltd","author":"Santos Wesley","year":"2019","unstructured":"Wesley Santos and Ivandr\u00e9 Paraboni . 2019 . Moral Stance Recognition and Polarity Classification from Twitter and Elicited Text . In Proceedings of the International Conference on Recent Advances in Natural Language Processing. INCOMA Ltd , Varna, Bulgaria, 1148\u20131160. https:\/\/doi.org\/10.26615\/978-954-452-056-4_123 10.26615\/978-954-452-056-4_123 Wesley Santos and Ivandr\u00e9 Paraboni. 2019. Moral Stance Recognition and Polarity Classification from Twitter and Elicited Text. In Proceedings of the International Conference on Recent Advances in Natural Language Processing. INCOMA Ltd, Varna, Bulgaria, 1148\u20131160. https:\/\/doi.org\/10.26615\/978-954-452-056-4_123"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1121"},{"key":"e_1_3_2_1_22_1","volume-title":"\u00a0Carvalho Carvalho","author":"Vicente Marco","year":"2019","unstructured":"Marco Vicente , Fernando Batista , and Joao P . \u00a0Carvalho Carvalho . 2019 . Gender Detection of Twitter Users Based on Multiple Information Sources. Springer International Publishing , Berna, SW, 39\u201354. https:\/\/doi.org\/10.1007\/978-3-030-01632-6_3 10.1007\/978-3-030-01632-6_3 Marco Vicente, Fernando Batista, and Joao P.\u00a0Carvalho Carvalho. 2019. Gender Detection of Twitter Users Based on Multiple Information Sources. Springer International Publishing, Berna, SW, 39\u201354. https:\/\/doi.org\/10.1007\/978-3-030-01632-6_3"}],"event":{"name":"WebMedia '22: Brazilian Symposium on Multimedia and Web","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGMM ACM Special Interest Group on Multimedia"],"location":"Curitiba Brazil","acronym":"WebMedia '22"},"container-title":["Proceedings of the Brazilian Symposium on Multimedia and the Web"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3539637.3557057","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3539637.3557057","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:38:03Z","timestamp":1750178283000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3539637.3557057"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,11,7]]},"references-count":24,"alternative-id":["10.1145\/3539637.3557057","10.1145\/3539637"],"URL":"https:\/\/doi.org\/10.1145\/3539637.3557057","relation":{},"subject":[],"published":{"date-parts":[[2022,11,7]]},"assertion":[{"value":"2022-11-07","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}