{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,1]],"date-time":"2025-06-01T04:08:18Z","timestamp":1748750898758,"version":"3.41.0"},"reference-count":13,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,4,7]],"date-time":"2025-04-07T00:00:00Z","timestamp":1743984000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,4,7]],"date-time":"2025-04-07T00:00:00Z","timestamp":1743984000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,4,7]]},"DOI":"10.1109\/syscon64521.2025.11014869","type":"proceedings-article","created":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T17:43:30Z","timestamp":1748627010000},"page":"1-3","source":"Crossref","is-referenced-by-count":0,"title":["Operationalizing Common Crawl News: AI-Enabled Data Pipeline for Large-Scale News Analysis"],"prefix":"10.1109","author":[{"given":"Ameir","family":"El Ouadi","sequence":"first","affiliation":[{"name":"United States Military Academy,Department of Systems Engineering,West Point,NY,USA"}]},{"given":"William","family":"Knowlton","sequence":"additional","affiliation":[{"name":"United States Military Academy,Department of Systems Engineering,West Point,NY,USA"}]},{"given":"Adrian","family":"Pimentel","sequence":"additional","affiliation":[{"name":"United States Military Academy,Department of Systems Engineering,West Point,NY,USA"}]},{"given":"David","family":"Beskow","sequence":"additional","affiliation":[{"name":"United States Military Academy,Department of Systems Engineering,West Point,NY,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3630106.3659033"},{"journal-title":"Training data for the price of a sandwichl","year":"2024","author":"Baack","key":"ref2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/SysCon61195.2024.10553540"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1146\/annurev.cs.03.060188.000323"},{"key":"ref5","article-title":"Fake news and phishing detection using a machine learning trained expert system","author":"Fitzpatrick","year":"2021","journal-title":"arXiv preprint"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.119509"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-021-10043-x"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2020.3028943"},{"key":"ref9","article-title":"Ccnet: Extracting high quality monolingual datasets from web crawl data","author":"Wenzek","year":"2019","journal-title":"arXiv preprint"},{"key":"ref10","article-title":"Languageagnostic bert sentence embedding","author":"Feng","year":"2020","journal-title":"arXiv preprint"},{"journal-title":"spacy: Industrial-strength natural language processing","year":"2020","author":"Honnibal","key":"ref11"},{"key":"ref12","article-title":"An outputbased evaluation framework for event extraction models","volume-title":"Proceedings of the Annual General Donald R. Keith Memorial Conference","author":"Brown","year":"2024"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/SysCon61195.2024.10553593"}],"event":{"name":"2025 IEEE International systems Conference (SysCon)","start":{"date-parts":[[2025,4,7]]},"location":"Montreal, QC, Canada","end":{"date-parts":[[2025,4,10]]}},"container-title":["2025 IEEE International systems Conference (SysCon)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11014641\/11014642\/11014869.pdf?arnumber=11014869","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,31]],"date-time":"2025-05-31T04:48:29Z","timestamp":1748666909000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11014869\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,7]]},"references-count":13,"URL":"https:\/\/doi.org\/10.1109\/syscon64521.2025.11014869","relation":{},"subject":[],"published":{"date-parts":[[2025,4,7]]}}}