{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T04:57:02Z","timestamp":1755838622564,"version":"3.40.3"},"publisher-location":"Cham","reference-count":18,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319669168"},{"type":"electronic","value":"9783319669175"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-66917-5_25","type":"book-chapter","created":{"date-parts":[[2017,8,24]],"date-time":"2017-08-24T07:14:52Z","timestamp":1503558892000},"page":"375-393","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Migrating Web Archives from HTML4 to HTML5: A Block-Based Approach and Its Evaluation"],"prefix":"10.1007","author":[{"given":"Andr\u00e9s","family":"Sanoja","sequence":"first","affiliation":[]},{"given":"St\u00e9phane","family":"Gan\u00e7arski","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,8,25]]},"reference":[{"issue":"2","key":"25_CR1","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1080\/17445760802429585","volume":"25","author":"J Cao","year":"2010","unstructured":"Cao, J., Mao, B., Luo, J.: A segmentation method for web page analysis using shrinking and dividing. Int. J. Parallel Emergent Distrib. Syst. 25(2), 93\u2013104 (2010)","journal-title":"Int. J. Parallel Emergent Distrib. Syst."},{"key":"25_CR2","unstructured":"Garret, J.: Preserving digital information. Technical report, Commission on Preservation and Access and the Research Libraries Group (1996)"},{"key":"25_CR3","unstructured":"Jackson, A.N.: Formats over time: exploring UK web history. CoRR, pp. 1210\u20131714 (2012)"},{"key":"25_CR4","doi-asserted-by":"crossref","unstructured":"Kohlsch\u00fctter, C., Nejdl, W.: A densitometric approach to web page segmentation. In: Proceedings of the 17th ACM Conference on Information and Knowledge Management, pp. 1173\u20131182, New York, NY, USA. ACM (2008)","DOI":"10.1145\/1458082.1458237"},{"issue":"2","key":"25_CR5","first-page":"41","volume":"36","author":"B Laws","year":"2013","unstructured":"Laws, B.: Seriously, another format? You must be kidding. CSE News 36(2), 41 (2013)","journal-title":"CSE News"},{"key":"25_CR6","doi-asserted-by":"publisher","unstructured":"Lin, S.-H., Ho, J.-M.: Discovering informative content blocks from web documents. In: Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2002, pp. 588\u2013593, Edmonton, Alberta, Canada. ACM (2002). ISBN: 1-58113-567-X. doi:10.1145\/775047.775134","DOI":"10.1145\/775047.775134"},{"key":"25_CR7","unstructured":"Moreau, E., Yvon, F., Capp\u00e9, O.: Robust similarity measures for named entities matching. In: Proceedings of the 22Nd International Conference on Computational Linguistics, vol. 1, COLING 2008, pp. 593\u2013600, Stroudsburg, PA, USA. Association for Computational Linguistics (2008). ISBN: 978-1-905593-44-6, http:\/\/dl.acm.org\/citation.cfm?id=1599081.1599156"},{"issue":"1","key":"25_CR8","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1145\/375360.375365","volume":"33","author":"G Navarro","year":"2001","unstructured":"Navarro, G.: A guided tour to approximate string matching. ACM Comput. Surv. 33(1), 31\u201388 (2001). doi:10.1145\/375360.375365. ISSN: 0360-0300","journal-title":"ACM Comput. Surv."},{"key":"25_CR9","unstructured":"Niwattanakul, S., Singthongchai, J., Naenudorn, E., Wanapu, S.: Using of Jaccard coefficient for keywords similarity. In: Proceedings of the International MultiConference of Engineers and Computer Scientists, vol. 1, pp. 13\u201315 (2013)"},{"key":"25_CR10","unstructured":"Park, S.H., Lynberg, N., Racer, J., McElmurray, P., Fox, E.A.: Html5 etds. In: Proceedings of International Symposium on Electronic thesis and Dissertations, Austin, TX, USA (2010)"},{"key":"25_CR11","doi-asserted-by":"crossref","unstructured":"Rosenthal, D.S.H., Lipkis, T., Robertson, T., Morabito, S.: Transparent format migration of preserved web content. D-Lib Mag. 11(1) (2005). http:\/\/dblp.uni-trier.de\/db\/journals\/dlib\/dlib11.html#RosenthalLRM05","DOI":"10.1045\/january2005-rosenthal"},{"issue":"2","key":"25_CR12","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1108\/07378831011047613","volume":"28","author":"DSH Rosenthal","year":"2010","unstructured":"Rosenthal, D.S.H.: Format obsolescence: assessing the threat and the defenses. Libr. Hi Tech 28(2), 195\u2013210 (2010)","journal-title":"Libr. Hi Tech"},{"key":"25_CR13","unstructured":"Sanoja, A.: Web page segmentation, evaluation and applications. PhD thesis, Universit\u00e9 Pierre et Marie Curie-Paris VI (2015). https:\/\/hal.inria.fr\/tel-01128002\/"},{"key":"25_CR14","doi-asserted-by":"crossref","unstructured":"Sanoja, A., Gan\u00e7arski, S.: Block-o-matic: a web page segmentation framework. In: International Conference on Multimedia Computing and Systems (ICMCS), pp. 595\u2013600, Marrakesh, Moroco, April 2014","DOI":"10.1109\/ICMCS.2014.6911249"},{"key":"25_CR15","doi-asserted-by":"crossref","unstructured":"Sanoja, A., Gan\u00e7arski, S.: Web page segmentation evaluation. In: Proceedings of the 30th Annual ACM Symposium on Applied Computing, pp. 753\u2013760. ACM (2015)","DOI":"10.1145\/2695664.2695786"},{"key":"25_CR16","unstructured":"Solis, B.: The conversation prism (2014). https:\/\/conversationprism.com"},{"issue":"2","key":"25_CR17","doi-asserted-by":"publisher","first-page":"123","DOI":"10.2218\/ijdc.v2i2.35","volume":"2","author":"J Van der Hoeven","year":"2007","unstructured":"Van der Hoeven, J.: Emulation for digital preservation in practice: the results. Int. J. Dig. Curation 2(2), 123\u2013132 (2007)","journal-title":"Int. J. Dig. Curation"},{"key":"25_CR18","unstructured":"W3Schools.com. HTML5 Migration: Migration from HTML4 to HTML5. W3Schools (2016). http:\/\/www.w3schools.com\/html\/html5_migration.asp"}],"container-title":["Lecture Notes in Computer Science","Advances in Databases and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-66917-5_25","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,13]],"date-time":"2024-03-13T16:14:56Z","timestamp":1710346496000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-66917-5_25"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319669168","9783319669175"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-66917-5_25","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2017]]},"assertion":[{"value":"25 August 2017","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}