{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T11:19:06Z","timestamp":1770549546905,"version":"3.49.0"},"reference-count":53,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2004,8,1]],"date-time":"2004-08-01T00:00:00Z","timestamp":1091318400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Computers and the Humanities"],"published-print":{"date-parts":[[2004,8]]},"DOI":"10.1007\/s10579-004-8682-1","type":"journal-article","created":{"date-parts":[[2004,11,3]],"date-time":"2004-11-03T04:31:17Z","timestamp":1099456277000},"page":"253-270","source":"Crossref","is-referenced-by-count":17,"title":["Article: Collating Texts Using Progressive Multiple Alignment"],"prefix":"10.1007","volume":"38","author":[{"given":"Matthew","family":"Spencer","sequence":"first","affiliation":[]},{"given":"Christopher","family":"Howe","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"CR1","doi-asserted-by":"crossref","first-page":"839","DOI":"10.1038\/29667","volume":"394","author":"A.C. Barbrook","year":"1998","unstructured":"Barbrook A.C., Howe C.J., Blake N., Robinson P. (1998) The Phylogeny of The Canterbury Tales. Nature, 394, p.839.","journal-title":"Nature"},{"key":"CR2","volume-title":"The Canterbury Tales Project Occasional Papers","year":"1997","unstructured":"Blake N., Robinson P. (eds.) (1997) The Canterbury Tales Project Occasional Papers, Vol. II. Office for Humanities Communication Publications, London. 184 p."},{"key":"CR3","unstructured":"Brown M.P.S. (2000) Small Subunit Ribosomal RNA Modeling Using Stochastic Context-free Grammars. ISMB Proceedings 2000. American Association for Arti cial Intelligence, pp.57-66."},{"key":"CR4","doi-asserted-by":"crossref","first-page":"227","DOI":"10.9783\/9781512802450-014","volume-title":"Biological Metaphor and Cladistic Classification: An Interdisciplinary Perspective","author":"H.D. Cameron","year":"1987","unstructured":"Cameron H.D. (1987) The Upside-Down Cladogram:Problems in Manuscript Affiliation. In Hoenigswald, H.M., Wiener, L.F. (eds.), Biological Metaphor and Cladistic Classification: An Interdisciplinary Perspective. Frances Pinter, London, pp.227-242."},{"key":"CR5","doi-asserted-by":"crossref","first-page":"33","DOI":"10.1007\/BF02399140","volume":"10","author":"R.L. Cannon Jr.","year":"1976","unstructured":"Cannon R.L., Jr. (1976) OPCOL: An Optimal Text Collation Algorithm. Computers and the Humanities, 10, pp.33-40.","journal-title":"Computers and the Humanities"},{"key":"CR6","first-page":"152","volume-title":"Proceedings of the 40th Anniversary Meeting for the Association for Computational Lin-guistics (ACL-02)","author":"P. Clough","year":"2002","unstructured":"Clough P., Gaizauskas R., Piao S.S.L., Wilks Y. (2002) METER: MEasuring TExt Reuse. Proceedings of the 40th Anniversary Meeting for the Association for Computational Lin-guistics (ACL-02). University of Pennsylvania, Philadelphia, USA, pp.152-159."},{"key":"CR7","doi-asserted-by":"crossref","unstructured":"Cull P., Hsu T. (1999) Improved Parallel and Sequential Walking Tree Methods for Biological String Alignments. Supercomputing '99.","DOI":"10.1145\/331532.331583"},{"key":"CR8","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511790492","volume-title":"Biological Sequence Analysis","author":"R. Durbin","year":"1998","unstructured":"Durbin R., Eddy S., Krogh A., Mitchison G. (1998) Biological Sequence Analysis. Cambridge University Press, Cambridge. 356 p."},{"key":"CR9","doi-asserted-by":"crossref","first-page":"351","DOI":"10.1007\/BF02603120","volume":"25","author":"D.-F. Feng","year":"1987","unstructured":"Feng D.-F., Doolittle R.F. (1987) Progressive Sequence Alignment as a Prerequisite to Correct Phylogenetic Trees. Journal of Molecular Evolution, 25, pp.351-360.","journal-title":"Journal of Molecular Evolution"},{"key":"CR10","doi-asserted-by":"crossref","first-page":"705","DOI":"10.1016\/0022-2836(82)90398-9","volume":"162","author":"O. Gotoh","year":"1982","unstructured":"Gotoh O. (1982) An Improved Algorithm for Matching Biological Sequences. Journal of Molecular Biology, 162, pp.705-708.","journal-title":"Journal of Molecular Biology"},{"key":"CR11","doi-asserted-by":"crossref","first-page":"823","DOI":"10.1006\/jmbi.1996.0679","volume":"264","author":"O. Gotoh","year":"1996","unstructured":"Gotoh O. (1996) Significant Improvement in Accuracy of Multiple Protein Sequence Align-ments by Iterative Refinement as Assessed by Reference to Structural Alignments. Journal of Molecular Biology, 264, pp.823-838.","journal-title":"Journal of Molecular Biology"},{"key":"CR12","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1017\/CBO9780511597855.001","volume-title":"Natural Language Parsing: Psychological, Computational, and Theoretical Perspectives","author":"L. Karttunen","year":"1985","unstructured":"Karttunen L., Zwicky A.M. (1985) Introduction. In Dowty, D.R., Karttunen, L., Zwicky, A.M. (eds.), Natural Language Parsing: Psychological, Computational, and Theoretical Perspectives. Cambridge University Press, Cambridge, pp.1-25."},{"key":"CR13","doi-asserted-by":"crossref","first-page":"201","DOI":"10.1137\/1025045","volume":"25","author":"J.B. Kruskal","year":"1983","unstructured":"Kruskal J.B. (1983) An Overview of Sequence Comparison: Time Warps, String Edits, and Macromolecules. SIAM Review, 25, pp.201-237.","journal-title":"SIAM Review"},{"key":"CR14","doi-asserted-by":"crossref","first-page":"377","DOI":"10.1145\/146370.146380","volume":"24","author":"K. Kukich","year":"1992","unstructured":"Kukich K. (1992) Techniques for Automatically Correcting Words in Text. ACM Computing Surveys, 24, pp.377-439.","journal-title":"ACM Computing Surveys"},{"key":"CR15","unstructured":"Lantin A.-C., Baret P.V., Mac\u00e9 C. (2004) Phylogenetic Analysis of Gregory of Nazianzus Homily 27. Le poids des mots: Proceedings of the 7th International Conference on the Statistical Analysis of Textual Data. Louvain-la-Neuve, pp.700-707."},{"key":"CR16","doi-asserted-by":"crossref","first-page":"35","DOI":"10.1016\/0885-2308(90)90022-X","volume":"4","author":"K. Lari","year":"1990","unstructured":"Lari K., Young S.J. (1990) The Estimation of Stochastic Context-Free Grammars Using the Inside-Outside Algorithm. Computer Speech and Language, 4, pp.35-56.","journal-title":"Computer Speech and Language"},{"key":"CR17","first-page":"24","volume":"20","author":"A.R. Lee","year":"1989","unstructured":"Lee A.R. (1989) Numerical Taxonomy Revisited: John Griffith, Cladistic Analysis and St. Augustine's Quaestiones in Heptateuchem. Stadia Patristica, 20, pp.24-32.","journal-title":"Stadia Patristica"},{"key":"CR18","first-page":"261","volume-title":"Computers in Literary and Linguistic Research","author":"A.R. Lee","year":"1990","unstructured":"Lee A.R. (1990) BLUDGEON: A Blunt Instrument for the Analysis of Contamination in Textual Traditions. In Choueka, Y. (ed.), Computers in Literary and Linguistic Research. Champion-Slatkine, Paris, pp.261-292."},{"key":"CR19","doi-asserted-by":"crossref","first-page":"590","DOI":"10.1093\/sysbio\/46.4.590","volume":"46","author":"D.R. Maddison","year":"1997","unstructured":"Maddison D.R., Swofford D.L., Maddison W.P. (1997) NEXUS: An Extensible File Format for Systematic Information. Systematic Biology, 46, pp.590-621.","journal-title":"Systematic Biology"},{"key":"CR20","volume-title":"Foundations of Statistical Natural Language Processing","author":"C.D. Manning","year":"1999","unstructured":"Manning C.D., Sch\u00fctze H. (1999) Foundations of Statistical Natural Language Processing. The MIT Press, Cambridge, MA, 680 p."},{"key":"CR21","doi-asserted-by":"crossref","first-page":"275","DOI":"10.3406\/rht.2003.1514","volume":"31","author":"L.R. Mooney","year":"2001","unstructured":"Mooney L.R., Barbrook A.C., Howe C.J., Spencer M. (2001) Stemmatic Analysis of Lydgate 's ?Kings of England?: A Test Case for the Application of Software Developed for Evolu-tionary Biology to Manuscript Stemmatics. Revue d' Histoire des Textes, 31, pp.275-297.","journal-title":"Revue d' Histoire des Textes"},{"key":"CR22","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1145\/375360.375365","volume":"33","author":"G. Navarro","year":"2001","unstructured":"Navarro G. (2001) A Guided Tour to Approximate String Matching. ACM Computing Sur-veys, 33, pp.31-88.","journal-title":"ACM Computing Sur-veys"},{"key":"CR23","first-page":"131","volume":"3","author":"C. Notredame","year":"2002","unstructured":"Notredame C. (2002) Recent Progresses in Multiple Sequence Alignment: A Survey. Phar-macogenomics, 3, pp.131-144.","journal-title":"Phar-macogenomics"},{"key":"CR24","doi-asserted-by":"crossref","first-page":"205","DOI":"10.1006\/jmbi.2000.4042","volume":"302","author":"C. Notredame","year":"2000","unstructured":"Notredame C., Higgins D.G., Heringa J. (2000) T-Coffee: A Novel Method for Fast and Accurate Multiple Sequence Alignment. Journal of Molecular Biology, 302, pp.205-217.","journal-title":"Journal of Molecular Biology"},{"key":"CR25","first-page":"41","volume-title":"Advances in Computer-Aided Literary and Linguistic Research","author":"W. Ott","year":"1979","unstructured":"Ott W. (1979) The Output of Collation Programs. In Ager, D.E., Knowles, F.E., Smith, J. (eds.), Advances in Computer-Aided Literary and Linguistic Research. Department of Modern Languages, University of Aston, Birmingham, pp.41-51."},{"key":"CR26","first-page":"205","volume-title":"Computers and Written Texts","author":"W. Ott","year":"1992","unstructured":"Ott W. (1992) Computers and Textual Editing. In Butler, C.S. (ed.), Computers and Written Texts, Blackwell, Oxford, pp.205-226."},{"key":"CR27","doi-asserted-by":"crossref","first-page":"93","DOI":"10.1093\/llc\/15.1.93","volume":"15","author":"W. Ott","year":"2000","unstructured":"Ott W. (2000) Strategies and Tools for Textual Scholarship: The T\u00fcbingen System of Text Processing Programs (TUSTEP). Literary and Linguistic Computing, 15, pp.93-108.","journal-title":"Literary and Linguistic Computing"},{"key":"CR28","doi-asserted-by":"crossref","first-page":"1447","DOI":"10.1002\/1097-024X(20001110)30:13<1447::AID-SPE344>3.0.CO;2-C","volume":"30","author":"E.G.M. Petrakis","year":"2000","unstructured":"Petrakis E.G.M., Tzeras K. (2000) Similarity Searching in the CORDIS Text Database. Software-Practice and Experience, 30, pp.1447-1464.","journal-title":"Software-Practice and Experience"},{"key":"CR29","doi-asserted-by":"crossref","first-page":"380","DOI":"10.2307\/2412794","volume":"26","author":"N.I. Platnick","year":"1977","unstructured":"Platnick N.I., Cameron H.D. (1977) Cladistic Methods in Textual, Linguistic, and Phyloge-netic Analysis. Systematic Zoology, 26, pp.380-385.","journal-title":"Systematic Zoology"},{"key":"CR30","doi-asserted-by":"crossref","first-page":"48","DOI":"10.1108\/EUM0000000007161","volume":"54","author":"A.M. Robertson","year":"1998","unstructured":"Robertson A.M., Willett P. (1998) Applications of n-grams in Textual Information Systems. Journal of Documentation, 54, pp.48-69.","journal-title":"Journal of Documentation"},{"key":"CR31","volume-title":"Collate 2:A User Guide","author":"P. Robinson","year":"1994","unstructured":"Robinson P. (1994a) Collate 2:A User Guide. Oxford University Computing Services, Oxford, 137 p."},{"key":"CR32","first-page":"69","volume-title":"The Canterbury Tales Project: Occasional Papers Vol. II","author":"P. Robinson","year":"1997","unstructured":"Robinson P. (1997) A Stemmatic Analysis of the Fifteenth-Century Witnesses to The Wife of Bath 's Prologue. In Blake, N., Robinson, P. (eds.), The Canterbury Tales Project: Occasional Papers Vol. II. Office for Humanities Communication Publications, London, pp. 69-132."},{"key":"CR33","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1093\/llc\/4.2.99","volume":"4","author":"P.M.W. Robinson","year":"1989","unstructured":"Robinson P.M.W. (1989) The Collation and Textual Criticism of Icelandic Manuscripts. (1): Collation. Literary and Linguistic Computing, 4, pp.99-105.","journal-title":"Literary and Linguistic Computing"},{"key":"CR34","volume-title":"Collate: Interactive Collation of Large Textual Traditions","author":"P.M.W. Robinson","year":"1994","unstructured":"Robinson P.M.W. (1994b) Collate: Interactive Collation of Large Textual Traditions. Oxford University Centre for Humanities Computing, Oxford."},{"key":"CR35","first-page":"115","volume-title":"Research in Humanities Computing","author":"P.M.W. Robinson","year":"1996","unstructured":"Robinson P.M.W., O'Hara R.J. (1996) Cladistic Analysis of an Old Norse Manuscript Tra-dition. In Hockey, S., Ide, N. (eds.), Research in Humanities Computing 4. Oxford Uni-versity Press, Oxford, pp.115-137."},{"key":"CR36","volume-title":"Literary Computing","author":"C.F. Sabourin","year":"1994","unstructured":"Sabourin C.F. (1994) Literary Computing. Infolingua, Montreal, 581 p."},{"key":"CR37","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1075\/z.79.03sal","volume-title":"Studies in Stemmatology","author":"B.J.P. Salemans","year":"1996","unstructured":"Salemans B.J.P. (1996) Cladistics or the Resurrection of the Method of Lachmann: On Building the Stemma of Yvain. In van Reenen, P., van Mulken, M. (eds.), Studies in Stemmatology. John Benjamins Publishing Company, Amsterdam, pp.3-70."},{"key":"CR38","volume-title":"Building Stemmas with the Computer in a Cladistic, Neo-Lach-mannian Way","author":"B.J.P. Saflemans","year":"2000","unstructured":"Saflemans B.J.P. (2000) Building Stemmas with the Computer in a Cladistic, Neo-Lach-mannian Way. Katholieke Universiteit, Nijmegen, 351 p."},{"key":"CR39","doi-asserted-by":"crossref","first-page":"1339","DOI":"10.1098\/rsta.2000.0590","volume":"358","author":"G. Sampson","year":"2000","unstructured":"Sampson G. (2000) The Role of Taxonomy in Language Engineering. Philosophical Trans-actions of the Royal Society of London Series A, 358, pp.1339-1355.","journal-title":"Philosophical Trans-actions of the Royal Society of London Series A"},{"key":"CR40","doi-asserted-by":"crossref","first-page":"503","DOI":"10.1016\/j.jtbi.2003.11.022","volume":"227","author":"M. Spencer","year":"2004","unstructured":"Spencer M., Davidson E.A., Barbrook A.C., Howe C.J. (2004a) Phylogenetics of Artificial Manuscripts. Journal of Theoretical Biology, 227, pp.503-511.","journal-title":"Journal of Theoretical Biology"},{"key":"CR41","doi-asserted-by":"crossref","first-page":"467","DOI":"10.1093\/llc\/16.4.467","volume":"16","author":"M. Spencer","year":"2001","unstructured":"Spencer M., Howe C.J. (2001) Estimating Distances between Manuscripts Based on Copying Errors. Literary and Linguistic Computing, 16, pp.467-484.","journal-title":"Literary and Linguistic Computing"},{"key":"CR42","doi-asserted-by":"crossref","unstructured":"Spencer M., Mooney L.R., Barbrook A.C., Bordalejo B., Howe C.J., Robinson P. (in press) The Effects of Weighting Kinds of Variants. In den Hollander, A. (ed.), Studies in Stemmatology II. John Benjamins Publishing Company, Amsterdam.","DOI":"10.1075\/z.125.13spe"},{"key":"CR43","unstructured":"Spencer M., Wachtel K., Howe C.J. (2002) The Greek Vorlage of the Syra Harclensis: A Comparative Study on Method in Exploring Textual Genealogy. TC: a Journal of Biblical Textual Criticism 7."},{"key":"CR44","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1023\/B:CHUM.0000009290.14571.59","volume":"38","author":"M. Spencer","year":"2004","unstructured":"Spencer M., Wachtel K., Howe C.J. (2004b) Representing Multiple Pathways of Textual Flow in the Greek Manuscripts of the Letter of James Using Reduced Median Networks. Computers and the Humanities, 38, pp.1-14.","journal-title":"Computers and the Humanities"},{"key":"CR45","unstructured":"Sperberg-McQueen C.M., Burnard L. (eds.) (2002) TEI P4:Guidelines for Electronic Text Encoding and Interchange. Text Encoding Initiative Consortium.XML Version, Oxford, Providence, Charlottesville, Bergen"},{"key":"CR46","doi-asserted-by":"crossref","first-page":"139","DOI":"10.1093\/llc\/18.2.139","volume":"18","author":"M. Stoliz","year":"2003","unstructured":"Stoliz M. (2003) New Philology and New Phylogeny:Aspects of a Critical Electronic Edition of Wolfram's Parzival. Literary and Linguistic Computing, 18, pp.139-150.","journal-title":"Literary and Linguistic Computing"},{"key":"CR47","first-page":"729","volume":"5","author":"J.A. Studier","year":"1988","unstructured":"Studier J.A., Keppler K.J. (1988) A Note on the Neighbor-Joining Algorithm of Saitou and Nei. Molecular Biology and Evolution, 5, pp.729-731.","journal-title":"Molecular Biology and Evolution"},{"key":"CR48","unstructured":"Thorpe J.C. (2002) Multivariate Statistical Analysis for Manuscript Classification. TC:A Journal of Biblical Textual Criticism, 7."},{"key":"CR49","doi-asserted-by":"crossref","unstructured":"Toutanova K., llhan H.T., Manning C.D. (2002) Extensions to HMM-Based Statistical Word Alignment Models. Proceedings of the 2002 Conference on Empirical Methods in Natural Language Processing, pp.87-94.","DOI":"10.3115\/1118693.1118705"},{"key":"CR50","doi-asserted-by":"crossref","first-page":"191","DOI":"10.1016\/0304-3975(92)90143-4","volume":"92","author":"E. Ukkonen","year":"1992","unstructured":"Ukkonen E. (1992) Approximate String-Matching with q-grams and Maximal Matches. Theoretical Computer Science, 92, pp.191-211.","journal-title":"Theoretical Computer Science"},{"key":"CR51","doi-asserted-by":"crossref","unstructured":"Wagner R.A. (1975) On the Complexity of the Extended String-to-String Correction Problem. Proceedings of the 7th Annual ACM Symposium on Theory of Computing, Albuquerque, New Mexico, pp.218-223.","DOI":"10.1145\/800116.803771"},{"key":"CR52","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-663-12401-6","volume-title":"Textual Criticism and Editorial Technique Applicable to Greek and Latin Texts","author":"M.L. West","year":"1973","unstructured":"West M.L. (1973) Textual Criticism and Editorial Technique Applicable to Greek and Latin Texts. B.G. Teubner, Stuttgart.155 p."},{"key":"CR53","doi-asserted-by":"crossref","unstructured":"Wise M.J. (1996) YAP3:Improved Detection of Similarities in Computer Program and Other Texts. SIGCSE '96, Philadelphia, USA, pp.130-134.","DOI":"10.1145\/236452.236525"}],"container-title":["Computers and the Humanities"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-004-8682-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10579-004-8682-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-004-8682-1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,4,29]],"date-time":"2023-04-29T22:05:06Z","timestamp":1682805906000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10579-004-8682-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2004,8]]},"references-count":53,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2004,8]]}},"alternative-id":["5278682"],"URL":"https:\/\/doi.org\/10.1007\/s10579-004-8682-1","relation":{},"ISSN":["0010-4817","1572-8412"],"issn-type":[{"value":"0010-4817","type":"print"},{"value":"1572-8412","type":"electronic"}],"subject":[],"published":{"date-parts":[[2004,8]]}}}