{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,19]],"date-time":"2025-12-19T15:46:21Z","timestamp":1766159181020,"version":"3.28.0"},"reference-count":46,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,6,18]],"date-time":"2023-06-18T00:00:00Z","timestamp":1687046400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,6,18]],"date-time":"2023-06-18T00:00:00Z","timestamp":1687046400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,6,18]]},"DOI":"10.1109\/ijcnn54540.2023.10192021","type":"proceedings-article","created":{"date-parts":[[2023,8,2]],"date-time":"2023-08-02T17:30:03Z","timestamp":1690997403000},"page":"1-8","source":"Crossref","is-referenced-by-count":1,"title":["Auto-TabTransformer: Hierarchical Transformers for Self and Semi Supervised Learning in Tabular Data"],"prefix":"10.1109","author":[{"given":"Akshay","family":"Sethi","sequence":"first","affiliation":[{"name":"AI Garage, Mastercard,Gurugram,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sonia","family":"Gupta","sequence":"additional","affiliation":[{"name":"AI Garage, Mastercard,Gurugram,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ayush","family":"Agarwal","sequence":"additional","affiliation":[{"name":"AI Garage, Mastercard,Gurugram,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nancy","family":"Agrawal","sequence":"additional","affiliation":[{"name":"AI Garage, Mastercard,Gurugram,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Siddhartha","family":"Asthana","sequence":"additional","affiliation":[{"name":"AI Garage, Mastercard,Gurugram,India"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939785"},{"key":"ref35","article-title":"Repre-sentation learning with contrastive predictive coding","author":"van den oord","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref12","article-title":"Why do tree-based models still outperform deep learning on typical tabular data?","author":"grinsztajn","year":"2022","journal-title":"Thirty-sixth Conference on Neural Information Processing Systems Datasets and Benchmarks Track"},{"key":"ref34","article-title":"Scarf: Self-supervised contrastive learning using random feature corruption","author":"bahri","year":"2021","journal-title":"ArXiv Preprint"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/0893-6080(90)90049-Q"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3511808.3557699"},{"key":"ref14","first-page":"6638","article-title":"CatBoost: unbiased boosting with categorical features","author":"prokhorenkova","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref36","first-page":"18853","article-title":"Subtab: Subsetting features of tabular data for self-supervised representation learning","volume":"34","author":"ucar","year":"2021","journal-title":"Advances in neural information processing systems"},{"key":"ref31","article-title":"Saint: Improved neural networks for tabular data via row attention and contrastive pre-training","author":"somepalli","year":"2021","journal-title":"ArXiv Preprint"},{"key":"ref30","first-page":"28742","article-title":"Self-attention between datapoints: Going beyond individual input-output pairs in deep learning","volume":"34","author":"kossen","year":"2021","journal-title":"Advances in neural information processing systems"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1287\/mnsc.2016.2644"},{"key":"ref33","article-title":"mixup: Beyond empirical risk minimization","author":"zhang","year":"2017","journal-title":"ArXiv Preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3357925"},{"key":"ref32","first-page":"6023","article-title":"Cut-mix: Regularization strategy to train strong classifiers with localizable features","author":"yun","year":"2019","journal-title":"Proceedings of the IEEE\/CVF International Conference on Computer Vision"},{"key":"ref2","first-page":"2961","article-title":"Mask r-cnn","author":"he","year":"2017","journal-title":"Proceedings of the IEEE International Conference on Computer Vision"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.tics.2020.09.004"},{"journal-title":"Int'l Conf on Learning Representations (ICLR)","year":"0","author":"balle","key":"ref39"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3390\/technologies9010002"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1016\/S0893-6080(96)00110-4"},{"key":"ref19","first-page":"11033","article-title":"Vime: Extending the success of self-and semi-supervised learning to tabu-lar domain","volume":"33","author":"yoon","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICACCS51430.2021.9441668"},{"key":"ref24","article-title":"An image is worth 16&#x00D7;16 words: Transformers for image recognition at scale","author":"dosovitskiy","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref46","first-page":"189","article-title":"Comparative Accuracies of Neural Networks and Discriminant Analysis in Predicting Forest Cover Types from Cartographic Variables","author":"blackard","year":"1998","journal-title":"Second Southern Forestry GIS Conference"},{"key":"ref23","first-page":"12310","article-title":"Barlow twins: Self-supervised learning via redundancy reduction","author":"zbontar","year":"2021","journal-title":"International Conference on Machine Learning"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-01595-8_16"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.167"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1109\/ICASSP39728.2021.9413901","article-title":"Attention is all you need in speech separation","author":"subakan","year":"2021","journal-title":"ICASSP 2021-2021 IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP)"},{"key":"ref20","first-page":"18932","article-title":"Revisiting deep learning models for tabular data","volume":"34","author":"gorishniy","year":"2021","journal-title":"Advances in neural information processing systems"},{"key":"ref42","first-page":"10524","article-title":"On layer normalization in the transformer architecture","author":"xiong","year":"2020","journal-title":"International Conference on Machine Learning"},{"journal-title":"A note on connecting barlow twins with negative-sample-free contrastive learning","year":"2021","author":"tsai","key":"ref41"},{"key":"ref22","first-page":"1597","article-title":"A simple framework for contrastive learning of visual representations","author":"chen","year":"2020","journal-title":"International Conference on Machine Learning"},{"key":"ref44","article-title":"Scaling Up the Accuracy of Naive-Bayes Classifiers: a Decision- Tree Hybrid","author":"kohavi","year":"1996","journal-title":"Proceedings of the Second International Con-ference on Knowledge Discovery and Data Mining"},{"key":"ref21","first-page":"5628","article-title":"A theoretical analysis of contrastive unsupervised representation learning","author":"saunshi","year":"2019","journal-title":"International Conference on Machine Learning"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.1994.576879"},{"journal-title":"Tabtransformer Tabular data modeling using contextual embeddings","year":"2020","author":"huang","key":"ref28"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i8.16826"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414142"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/9780262033589.001.0001"},{"key":"ref7","first-page":"649","article-title":"Colorful image col-orization","author":"zhang","year":"2016","journal-title":"European Conference on Computer Vision"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/2988450.2988454"},{"key":"ref4","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"devlin","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref3","first-page":"5998","article-title":"Attention is all you need","author":"vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref6","first-page":"69","article-title":"Unsupervised learning of visual representations by solving jigsaw puzzles","author":"noroozi","year":"2016","journal-title":"European Conference on Computer Vision"},{"key":"ref5","article-title":"Unsupervised representation learning by predicting image rotations","author":"gidaris","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1996.8.4.773"}],"event":{"name":"2023 International Joint Conference on Neural Networks (IJCNN)","start":{"date-parts":[[2023,6,18]]},"location":"Gold Coast, Australia","end":{"date-parts":[[2023,6,23]]}},"container-title":["2023 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10190990\/10190992\/10192021.pdf?arnumber=10192021","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,21]],"date-time":"2023-08-21T17:47:44Z","timestamp":1692640064000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10192021\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,18]]},"references-count":46,"URL":"https:\/\/doi.org\/10.1109\/ijcnn54540.2023.10192021","relation":{},"subject":[],"published":{"date-parts":[[2023,6,18]]}}}