{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T10:29:42Z","timestamp":1742984982616,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":22,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642201271"},{"type":"electronic","value":"9783642201288"}],"license":[{"start":{"date-parts":[[2013,1,1]],"date-time":"2013-01-01T00:00:00Z","timestamp":1356998400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2013,1,1]],"date-time":"2013-01-01T00:00:00Z","timestamp":1356998400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013]]},"DOI":"10.1007\/978-3-642-20128-8_7","type":"book-chapter","created":{"date-parts":[[2013,12,13]],"date-time":"2013-12-13T12:15:18Z","timestamp":1386936918000},"page":"131-149","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Exploiting Comparable Corpora for Lexicon Extraction: Measuring and Improving Corpus Quality"],"prefix":"10.1007","author":[{"given":"Bo","family":"Li","sequence":"first","affiliation":[]},{"given":"Eric","family":"Gaussier","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2013,12,14]]},"reference":[{"key":"7_CR1","doi-asserted-by":"crossref","unstructured":"Ballesteros, L., Croft, W.B.: Phrasal translation and query expansion techniques for cross-language information retrieval. In: Proceedings of the 20th ACM SIGIR, pp. 84\u201391, Philadelphia, Pennsylvania, USA (1997)","DOI":"10.1145\/278459.258540"},{"key":"7_CR2","doi-asserted-by":"crossref","unstructured":"D\u00e9jean, H., Gaussier, E., Sadat, F.: An approach based on multilingual thesauri and model combination for bilingual lexicon extraction. In: Proceedings of the 19th International Conference on Computational Linguistics, pp. 1\u20137, Taipei, Taiwan (2002)","DOI":"10.3115\/1072228.1072394"},{"key":"7_CR3","unstructured":"Fung, P., McKeown, K.: Finding terminology translations from non-parallel corpora. In: Proceedings of the 5th Annual Workshop on Very Large Corpora, pp. 192\u2013202, Hong Kong (1997)"},{"key":"7_CR4","doi-asserted-by":"crossref","unstructured":"Fung, P., Yee, L.Y.: An IR approach for translating new words from nonparallel, comparable texts. In: Proceedings of the 17th International Conference on Computational linguistics, pp. 414\u2013420, Montreal, Quebec, Canada (1998)","DOI":"10.3115\/980451.980916"},{"key":"7_CR5","doi-asserted-by":"crossref","unstructured":"Garera, N., Callison-Burch, C., Yarowsky, D.: Improving translation lexicon induction from monolingual corpora via dependency contexts and part-of-speech equivalences. In: CoNLL 09: Proceedings of the Thirteenth Conference on Computational Natural Language Learning, pp. 129\u2013137, Boulder, Colorado (2009)","DOI":"10.3115\/1596374.1596397"},{"key":"7_CR6","doi-asserted-by":"crossref","unstructured":"Gaussier, E., Renders, J.M., Matveeva, I., Goutte, C., D\u00e9jean, H.: A geometric view on bilingual lexicon extraction from comparable corpora. In: Proceedings of the 42nd Annual Meeting of the Association for Computational Linguistics, pp. 526\u2013533, Barcelona, Spain (2004)","DOI":"10.3115\/1218955.1219022"},{"key":"7_CR7","unstructured":"Goeuriot, L., Grabar, N., Daille, B.: Characterization of scientific and popular science discourse in French, Japanese and Russian. In: LREC. Marrakech, Morocco (2008)"},{"key":"7_CR8","unstructured":"Koehn, P.: Europarl: a parallel corpus for statistical machine translation. In: Proceedings of MT Summit (2005)"},{"key":"7_CR9","unstructured":"Laroche, A., Langlais, P.: Revisiting context-based projection methods for term-translation spotting in comparable corpora. In: Proceedings of the 23rd International Conference on Computational Linguistics (Coling 2010), pp. 617\u2013625, Beijing, China (Aug 2010)"},{"key":"7_CR10","unstructured":"Li, B., Gaussier, E.: Improving corpus comparability for bilingual lexicon extraction from comparable corpora. In: Proceedings of the 23rd International Conference on Computational Linguistics, pp. 644\u2013652, Beijing, China (2010)"},{"key":"7_CR11","unstructured":"Li, B., Gaussier, E., Aizawa, A.: Clustering comparable corpora for bilingual lexicon extraction. In: Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies, pp. 473\u2013478, Portland, Oregon, USA (June 2011)"},{"key":"7_CR12","unstructured":"Morin, E., Daille, B., Takeuchi, K., Kageura, K.: Bilingual terminology mining\u2014using brain, not brawn comparable corpora. In: Proceedings of the 45th Annual Meeting of the Association for Computational Linguistics, pp. 664\u2013671, Prague, Czech Republic (2007)"},{"key":"7_CR13","doi-asserted-by":"crossref","unstructured":"Munteanu, D.S., Marcu, D.: Extracting parallel sub-sentential fragments from non-parallel corpora. In: Proceedings of the 21st International Conference on Computational Linguistics and the 44th annual meeting of the Association for Computational Linguistics, pp. 81\u201388, Sydney, Australia (2006)","DOI":"10.3115\/1220175.1220186"},{"issue":"1","key":"7_CR14","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1162\/089120103321337421","volume":"29","author":"FJ Och","year":"2003","unstructured":"Och, F.J., Ney, H.: A systematic comparison of various statistical alignment models. Comput. Linguist. 29(1), 19\u201351 (2003)","journal-title":"Comput. Linguist."},{"issue":"4","key":"7_CR15","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1007\/s10590-007-9029-7","volume":"20","author":"V Pekar","year":"2006","unstructured":"Pekar, V., Mitkov, R., Blagoev, D., Mulloni, A.: Finding translations for low-frequency words in comparable corpora. Mach. Transl. 20(4), 247\u2013266 (2006)","journal-title":"Mach. Transl."},{"key":"7_CR16","doi-asserted-by":"crossref","unstructured":"Rapp, R.: Automatic identification of word translations from unrelated English and German corpora. In: Proceedings of the 37th Annual Meeting of the Association for Computational Linguistics, pp. 519\u2013526, College Park, Maryland, USA (1999)","DOI":"10.3115\/1034678.1034756"},{"key":"7_CR17","doi-asserted-by":"crossref","unstructured":"Rayson, P., Garside, R.: Comparing corpora using frequency profiling. In: Proceedings of the Workshop on Comparing corpora, pp. 1\u20136, Hong Kong (2000)","DOI":"10.3115\/1117729.1117730"},{"key":"7_CR18","unstructured":"Robitaille, X., Sasaki, Y., Tonoike, M., Sato, S., Utsuro, T.: Compiling French-Japanese terminologies from the web. In: Proceedings of the 11th Conference of the European Chapter of the Association for Computational Linguistics, pp. 225\u2013232, Trento, Italy (2006)"},{"key":"7_CR19","unstructured":"Sharoff, S.: Comparing corpora using frequency profiling. In: Proceedings of Web as Corpus Workshop. Louvain-la-Neuve (2007)"},{"key":"7_CR20","unstructured":"Shezaf, D., Rappoport, A.: Bilingual lexicon generation using non-aligned signatures. In: Proceedings of the 48th Annual Meeting of the Association for Computational Linguistics, pp. 98\u2013107, Uppsala, Sweden (2010)"},{"key":"7_CR21","doi-asserted-by":"crossref","unstructured":"Voorhees, E.M.: The trec-8 question answering track report. In: Proceedings of the 8th Text Retrieval Conference, pp. 77\u201382 (1999)","DOI":"10.6028\/NIST.SP.500-246"},{"key":"7_CR22","doi-asserted-by":"crossref","unstructured":"Yu, K., Tsujii, J.: Extracting bilingual dictionary from comparable corpora with dependency heterogeneity. In: Proceedings of HLT-NAACL 2009, pp. 121\u2013124, Boulder, Colorado, USA (2009)","DOI":"10.3115\/1620853.1620888"}],"container-title":["Building and Using Comparable Corpora"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-20128-8_7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,8]],"date-time":"2023-07-08T23:37:11Z","timestamp":1688859431000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-642-20128-8_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013]]},"ISBN":["9783642201271","9783642201288"],"references-count":22,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-20128-8_7","relation":{},"subject":[],"published":{"date-parts":[[2013]]},"assertion":[{"value":"14 December 2013","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}