{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,28]],"date-time":"2025-10-28T03:11:15Z","timestamp":1761621075129,"version":"3.38.0"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"1-2","license":[{"start":{"date-parts":[[2011,9,22]],"date-time":"2011-09-22T00:00:00Z","timestamp":1316649600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Machine Translation"],"published-print":{"date-parts":[[2012,3]]},"DOI":"10.1007\/s10590-011-9102-0","type":"journal-article","created":{"date-parts":[[2011,9,21]],"date-time":"2011-09-21T03:38:43Z","timestamp":1316576323000},"page":"47-65","source":"Crossref","is-referenced-by-count":1,"title":["A comparison of segmentation methods and extended lexicon models for Arabic statistical machine translation"],"prefix":"10.1007","volume":"26","author":[{"given":"Sa\u0161a","family":"Hasan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Saab","family":"Mansour","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hermann","family":"Ney","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2011,9,22]]},"reference":[{"key":"9102_CR1","doi-asserted-by":"crossref","unstructured":"Bar-Haim R, Sima\u2019an K, Winter Y (2005) Choosing an optimal architecture for segmentation and POS-tagging of modern Hebrew. In: Semitic \u201905: proceedings of the ACL workshop on computational approaches to semitic languages, Morristown, NJ, USA, pp 39\u201346","DOI":"10.3115\/1621787.1621796"},{"issue":"2","key":"9102_CR2","first-page":"263","volume":"19","author":"PF Brown","year":"1993","unstructured":"Brown PF, Della Pietra SA, Della Pietra VJ, Mercer RL (1993) The mathematics of statistical machine translation: parameter estimation. Comput Linguist 19(2): 263\u2013311","journal-title":"Comput Linguist"},{"key":"9102_CR3","unstructured":"Buckwalter T (2002) Buckwalter Arabic Morphological Analyzer Version 1.0. Linguistic Data Consortium, University of Pennsylvania. LDC Catalog No.: LDC2002L49"},{"key":"9102_CR4","unstructured":"Carpuat M, Wu D (2007) Improving statistical machine translation using word sense disambiguation. In: EMNLP-CoNLL 2007, Prague, Czech Republic"},{"key":"9102_CR5","unstructured":"Chan YS, Ng HT, Chiang D (2007) Word sense disambiguation improves statistical machine translation. In: Proceedings of the 45th annual meeting of the ACL, Prague, Czech Republic, pp 33\u201340"},{"key":"9102_CR6","doi-asserted-by":"crossref","unstructured":"Chang PC, Galley M, Manning CD (2008) Optimizing Chinese word segmentation for machine translation performance. In: StatMT\u201908: proceedings of the third workshop on SMT, Morristown, NJ, USA, pp 224\u2013232","DOI":"10.3115\/1626394.1626430"},{"issue":"4","key":"9102_CR7","doi-asserted-by":"crossref","first-page":"283","DOI":"10.1006\/csla.2000.0147","volume":"14","author":"C Chelba","year":"2000","unstructured":"Chelba C, Jelinek F (2000) Structured language modeling. Comput Speech Lang 14(4): 283\u2013332","journal-title":"Comput Speech Lang"},{"key":"9102_CR8","doi-asserted-by":"crossref","first-page":"78","DOI":"10.1007\/3-540-58473-0_139","volume-title":"Grammatical inference and applications, second international colloquium, ICGI-94, vol 862","author":"SA Della Pietra","year":"1994","unstructured":"Della Pietra SA, Della Pietra VJ, Gillett JR, Lafferty JD, Printz H, Ure\u0161 L (1994) Inference and estimation of a long-range trigram model. In: Oncina J, Carrasco RC (eds) Grammatical inference and applications, second international colloquium, ICGI-94, vol 862. Springer, Alicante, pp 78\u201392"},{"issue":"1","key":"9102_CR9","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1111\/j.2517-6161.1977.tb01600.x","volume":"39","author":"AP Dempster","year":"1977","unstructured":"Dempster AP, Laird NM, Rubin DB (1977) Maximum likelihood from incomplete data via the EM algorithm. J R Stat Soc B 39(1): 1\u201322","journal-title":"J R Stat Soc B"},{"key":"9102_CR10","doi-asserted-by":"crossref","unstructured":"Diab M, Hacioglu K, Jurafsky D (2004) Automatic tagging of Arabic text: from raw text to base phrase chunks. In: HLT-NAACL 2004: short papers, Boston, MA, USA, pp 149\u2013152","DOI":"10.3115\/1613984.1614022"},{"key":"9102_CR11","doi-asserted-by":"crossref","unstructured":"El Isbihani A, Khadivi S, Bender O, Ney H (2006) Morpho-syntactic Arabic preprocessing for Arabic to English statistical machine translation. In: Proceedings on the workshop on SMT, New York, pp 15\u201322","DOI":"10.3115\/1654650.1654654"},{"key":"9102_CR12","doi-asserted-by":"crossref","first-page":"263","DOI":"10.1007\/978-1-4020-6046-5_14","volume-title":"Arabic computational morphology, text, speech and language technology, vol 38","author":"N Habash","year":"2007","unstructured":"Habash N (2007) Arabic morphological representations for machine translation. In: Soudi A, Bosch Avd, Neumann G (eds) Arabic computational morphology, text, speech and language technology, vol 38. Springer, Netherlands, pp 263\u2013285"},{"key":"9102_CR13","doi-asserted-by":"crossref","unstructured":"Habash N, Rambow O (2005) Arabic tokenization, part-of-speech tagging and morphological disambiguation in one fell swoop. In: Proceedings of the 43rd annual meeting of the ACL, Morristown, NJ, USA, pp 573\u2013580","DOI":"10.3115\/1219840.1219911"},{"key":"9102_CR14","doi-asserted-by":"crossref","unstructured":"Habash N, Sadat F (2006) Arabic preprocessing schemes for statistical machine translation. In: HLT- NAACL 2006: short papers, New York, USA, pp 49\u201352","DOI":"10.3115\/1614049.1614062"},{"key":"9102_CR15","doi-asserted-by":"crossref","unstructured":"Habash N, Soudi A, Buckwalter T (2007) On Arabic transliteration. In: Ide N, V\u00e9ronis J, Soudi A, Bosch Avd, Neumann G (eds) Arabic computational morphology, text, speech and language technology, vol 38, Springer, Netherlands, pp 15\u201322","DOI":"10.1007\/978-1-4020-6046-5_2"},{"key":"9102_CR16","unstructured":"Hamon O, Hartley A, Popescu-Belis A, Choukri K (2007) Assessing human and automated quality judgments in the French MT evaluation campaign CESTA. In: MT summit XI, Copenhagen, Denmark, pp 231\u2013238"},{"key":"9102_CR17","doi-asserted-by":"crossref","unstructured":"Hasan S, Ney H (2009) Comparison of extended lexicon models in search and rescoring for SMT. In: HLT-NAACL 2009: short papers, Boulder, CO, pp 17\u201320","DOI":"10.3115\/1620853.1620859"},{"key":"9102_CR18","unstructured":"Hasan S, El Isbihani A, Ney H (2006) Creating a large-scale Arabic to French statistical machine translation system. In: International conference on language resources and evaluation, Genoa, Italy, pp 855\u2013858"},{"key":"9102_CR19","doi-asserted-by":"crossref","unstructured":"Hasan S, Ganitkevitch J, Ney H, Andr\u00e9s-Ferrer J (2008) Triplet lexicon models for statistical machine translation. In: EMNLP 2008, Honolulu, Hawaii, pp 372\u2013381","DOI":"10.3115\/1613715.1613764"},{"key":"9102_CR20","doi-asserted-by":"crossref","unstructured":"Kim W, Khudanpur S (2003) Cross-lingual lexical triggers in statistical language modeling. In: EMNLP 2003, Morristown, NJ, USA, pp 17\u201324","DOI":"10.21236\/ADA459581"},{"key":"9102_CR21","doi-asserted-by":"crossref","unstructured":"Lee YS (2004) Morphological analysis for statistical machine translation. In: HLT-NAACL \u201904: proceedings of HLT-NAACL 2004: short papers, Morristown, NJ, USA, pp 57\u201360","DOI":"10.3115\/1613984.1613999"},{"key":"9102_CR22","unstructured":"Maamouri M, Bies A, Buckwalter T, Mekki W (2004) The Penn Arabic Treebank: building a large-scale annotated Arabic corpus. In: NEMLAR conference on Arabic language resources and tools"},{"key":"9102_CR23","doi-asserted-by":"crossref","unstructured":"Mansour S, Sima\u2019an K, Winter Y (2007) Smoothing a lexicon-based POS tagger for Arabic and Hebrew. In: Semitic \u201907: proceedings of the 2007 workshop on computational approaches to semitic languages, Morristown, NJ, USA, pp 97\u2013103","DOI":"10.3115\/1654576.1654593"},{"key":"9102_CR24","doi-asserted-by":"crossref","unstructured":"Mauser A, Hasan S, Ney H (2009) Extending statistical machine translation with discriminative and trigger-based lexicon models. In: EMNLP 2009, Singapore, pp 210\u2013217","DOI":"10.3115\/1699510.1699538"},{"key":"9102_CR25","doi-asserted-by":"crossref","unstructured":"Nguyen T, Vogel S (2008) Context-based arabic morphological analysis for machine translation. In: CoNLL \u201908, Morristown, NJ, USA, pp 135\u2013142","DOI":"10.3115\/1596324.1596348"},{"key":"9102_CR26","unstructured":"NIST (2009) NIST open MT evaluation. http:\/\/www.itl.nist.gov\/iad\/mig\/tests\/mt\/2009\/"},{"key":"9102_CR27","unstructured":"QUAERO (2008) Automatic multimedia content processing. http:\/\/www.quaero.org\/"},{"issue":"2","key":"9102_CR28","doi-asserted-by":"crossref","first-page":"249","DOI":"10.1162\/089120101750300526","volume":"27","author":"B Roark","year":"2001","unstructured":"Roark B (2001) Probabilistic top-down parsing and language modeling. Comput Linguist 27(2): 249\u2013276","journal-title":"Comput Linguist"},{"issue":"3","key":"9102_CR29","doi-asserted-by":"crossref","first-page":"187","DOI":"10.1006\/csla.1996.0011","volume":"10","author":"R Rosenfeld","year":"1996","unstructured":"Rosenfeld R (1996) A maximum entropy approach to adaptive statistical language modeling. Comput Speech Lang 10(3): 187\u2013228","journal-title":"Comput Speech Lang"},{"key":"9102_CR30","unstructured":"Sadat F, Habash N (2006) Combination of preprocessing schemes for statistical MT. In: Proceedings of the 44th annual meeting of the Association for Computational Linguistics (ACL), Sydney, Australia, pp 1\u20138"},{"key":"9102_CR31","doi-asserted-by":"crossref","unstructured":"Smith NA, Smith DA, Tromble RW (2005) Context-based morphological disambiguation with random fields. In: HLT \/EMNLP\u201905, Morristown, NJ, USA, pp 475\u2013482","DOI":"10.3115\/1220575.1220635"},{"key":"9102_CR32","doi-asserted-by":"crossref","unstructured":"Stolcke A (2002) SRILM\u2014an extensible language modeling toolkit. In: Proceedings of the seventh international conference on spoken language processing, ISCA, Denver, CO, USA, pp 901\u2013904","DOI":"10.21437\/ICSLP.2002-303"},{"key":"9102_CR33","unstructured":"Tillmann C, Ney H (1997) Word triggers and the EM algorithm. In: Proceedings of the special interest group workshop on computational natural language learning (ACL), Madrid, Spain, pp 117\u2013124"},{"key":"9102_CR34","unstructured":"Zens R, Ney H (2008) Improvements in dynamic programming beam search for phrase-based statistical machine translation. In: International workshop on spoken language translation, Honolulu, Hawaii, pp 195\u2013205"}],"container-title":["Machine Translation"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10590-011-9102-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10590-011-9102-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10590-011-9102-0","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,11]],"date-time":"2025-03-11T19:18:20Z","timestamp":1741720700000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10590-011-9102-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,9,22]]},"references-count":34,"journal-issue":{"issue":"1-2","published-print":{"date-parts":[[2012,3]]}},"alternative-id":["9102"],"URL":"https:\/\/doi.org\/10.1007\/s10590-011-9102-0","relation":{},"ISSN":["0922-6567","1573-0573"],"issn-type":[{"type":"print","value":"0922-6567"},{"type":"electronic","value":"1573-0573"}],"subject":[],"published":{"date-parts":[[2011,9,22]]}}}