{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,18]],"date-time":"2025-01-18T05:08:24Z","timestamp":1737176904643,"version":"3.33.0"},"reference-count":52,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,15]]},"DOI":"10.1109\/bigdata62323.2024.10825400","type":"proceedings-article","created":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T18:31:23Z","timestamp":1737052283000},"page":"1104-1113","source":"Crossref","is-referenced-by-count":0,"title":["Improving CLIP for Biomedical Retrieval: A Multi-Margin Contrastive Loss Approach"],"prefix":"10.1109","author":[{"given":"Ejan","family":"Shakya","sequence":"first","affiliation":[{"name":"University of Nebraska at Omaha,Department of Computer Science,Omaha,Nebraska,USA"}]},{"given":"Haritha Prasad","family":"Rayakota","sequence":"additional","affiliation":[{"name":"University of Nebraska at Omaha,Department of Computer Science,Omaha,Nebraska,USA"}]},{"given":"Pei-Chi","family":"Huang","sequence":"additional","affiliation":[{"name":"University of Nebraska at Omaha,Department of Computer Science,Omaha,Nebraska,USA"}]}],"member":"263","reference":[{"key":"ref1","first-page":"4904","article-title":"Scaling up visual and vision-language representation learning with noisy text supervision","volume-title":"International conference on machine learning","author":"Jia"},{"key":"ref2","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"International conference on machine learning","author":"Radford"},{"article-title":"Coca: Contrastive captioners are image-text foundation models","year":"2022","author":"Yu","key":"ref3"},{"article-title":"Florence: A new foundation model for computer vision","year":"2021","author":"Yuan","key":"ref4"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3626235"},{"key":"ref6","article-title":"Image captioners are scalable vision learners too","volume":"36","author":"Tschannen","year":"2024","journal-title":"Advances in Neural Information Processing Systems"},{"article-title":"Representation learning with contrastive predictive coding","year":"2018","author":"Oord","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.98.2.381"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/133160.133199"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/1132956.1132959"},{"key":"ref11","volume-title":"Introduction to information retrieval","volume":"39","author":"Sch\u00fctze","year":"2008"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.7717\/peerj.1279"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/s10669-017-9670-5"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/BIBM55620.2022.9994867"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1201\/9781003132981-5"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gkaa333"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btl235"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1093\/database\/baz034"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btab331"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btz228"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref22","article-title":"Faster r-cnn: Towards real-time object detection with region proposal networks","volume":"28","author":"Ren","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2019.09.207"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053405"},{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","year":"2021","author":"Dosovitskiy","key":"ref26"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"article-title":"Learning multiple layers of features from tiny images","year":"2009","author":"Krizhevsky","key":"ref28"},{"article-title":"Transunet: Transformers make strong encoders for medical image segmentation","year":"2021","author":"Chen","key":"ref29"},{"article-title":"Improving language understanding by generative pre-training","year":"2018","author":"Radford","key":"ref30"},{"article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","year":"2018","author":"Devlin","key":"ref31"},{"article-title":"Attention is all you need","year":"2023","author":"Vaswani","key":"ref32"},{"key":"ref33","article-title":"Xlnet: Generalized autoregressive pretraining for language understanding","volume":"32","author":"Yang","year":"2019","journal-title":"Advances in neural information processing systems"},{"article-title":"Roberta: A robustly optimized bert pretraining approach","year":"2019","author":"Liu","key":"ref34"},{"article-title":"Contrastive learning of medical visual representations from paired images and text. corr abs\/2010.00747 (2020)","year":"2020","author":"Zhang","key":"ref35"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00391"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19809-0_39"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-87196-3_26"},{"article-title":"Does clip benefit visual question answering in the medical domain as much as it does in the general domain?","year":"2021","author":"Eslami","key":"ref39"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01364-6_20"},{"article-title":"Self-supervised image-text pre-training with mixed data in chest x-rays","year":"2021","author":"Wang","key":"ref41"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.256"},{"key":"ref43","first-page":"755","article-title":"Medaug: Contrastive learning leveraging patient metadata improves representations for chest x-ray interpretation","volume-title":"Machine Learning for Healthcare Conference","author":"Vu"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20059-5_1"},{"article-title":"Google\u2019s neural machine translation system: Bridging the gap between human and machine translation","year":"2016","author":"Wu","key":"ref45"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.coling-main.59"},{"article-title":"Elevater: A benchmark and toolkit for evaluating language-augmented visual models","year":"2022","author":"Li","key":"ref47"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-00934-2_24"},{"article-title":"Decoupled weight decay regularization","year":"2017","author":"Loshchilov","key":"ref49"},{"article-title":"A rotation-equivariant convolutional neural network model of primary visual cortex","year":"2018","author":"Ecker","key":"ref50"},{"article-title":"Lung and colon cancer histopathological image dataset (lc25000)","year":"2019","author":"Borkowski","key":"ref51"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1148\/ryai.2019180041"}],"event":{"name":"2024 IEEE International Conference on Big Data (BigData)","start":{"date-parts":[[2024,12,15]]},"location":"Washington, DC, USA","end":{"date-parts":[[2024,12,18]]}},"container-title":["2024 IEEE International Conference on Big Data (BigData)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10824975\/10824942\/10825400.pdf?arnumber=10825400","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T08:18:27Z","timestamp":1737101907000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10825400\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,15]]},"references-count":52,"URL":"https:\/\/doi.org\/10.1109\/bigdata62323.2024.10825400","relation":{},"subject":[],"published":{"date-parts":[[2024,12,15]]}}}