{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,31]],"date-time":"2025-05-31T20:10:03Z","timestamp":1748722203670,"version":"3.41.0"},"publisher-location":"Cham","reference-count":38,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319255903"},{"type":"electronic","value":"9783319255910"}],"license":[{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-25591-0_15","type":"book-chapter","created":{"date-parts":[[2015,12,14]],"date-time":"2015-12-14T15:55:51Z","timestamp":1450108551000},"page":"201-213","source":"Crossref","is-referenced-by-count":2,"title":["Multi-domain Adapted Machine Translation Using Unsupervised Text Clustering"],"prefix":"10.1007","author":[{"given":"Lars","family":"Bungum","sequence":"first","affiliation":[]},{"given":"Bj\u00f6rn","family":"Gamb\u00e4ck","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,12,15]]},"reference":[{"key":"15_CR1","unstructured":"Axelrod, A., He, X., Gao, J.: Domain adaptation via pseudo in-domain data selection. In: Proceedings of the Conference on Empirical Methods in Natural Language Processing, EMNLP 2011, Edinburgh, UK, pp. 355\u2013362. Association for Computational Linguistics (2011)"},{"key":"15_CR2","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1016\/j.specom.2003.08.002","volume":"42","author":"JR Bellegarda","year":"2004","unstructured":"Bellegarda, J.R.: Statistical language model adaptation: review and perspectives. Speech Commun. 42, 93\u2013108 (2004)","journal-title":"Speech Commun."},{"key":"15_CR3","doi-asserted-by":"publisher","first-page":"7","DOI":"10.2478\/v10108-009-0011-9","volume":"91","author":"N Bertoldi","year":"2009","unstructured":"Bertoldi, N., Haddow, B., Fouet, J.-B.: Improved minimum error rate training in moses. Prague Bull. Math. Linguist. 91, 7\u201316 (2009)","journal-title":"Prague Bull. Math. Linguist."},{"issue":"2","key":"15_CR4","first-page":"79","volume":"16","author":"PF Brown","year":"1990","unstructured":"Brown, P.F., Cocke, J., Pietra, S.A.D., Pietra, V.J.D., Jelinek, F., Lafferty, J.D., Mercer, R.L., Roossin, P.S.: A statistical approach to machine translation. Comput. Linguist. 16(2), 79\u201385 (1990)","journal-title":"Comput. Linguist."},{"key":"15_CR5","unstructured":"Bungum, L., Gamb\u00e4ck, B.: A survey of domain adaptation in machine translation: towards a refinement of domain space. In: Proceedings of the India-Norway Workshop on Web Concepts and Technologies, Trondheim, Norway. Tapir Academic Press (2011)"},{"key":"15_CR6","unstructured":"Carpuat, M., Wu, D.: How phrase sense disambiguation outperforms word sense disambiguation for statistical machine translation. In: Proceedings of the 11th Conference on Theoretical and Methodological Issues in Machine Translation, pp. 43\u201352, September 2007"},{"key":"15_CR7","unstructured":"Carpuat, M., III, H.D., Fraser, A., Quirk, C., Braune, F., Clifton, A., Irvine, A., Jagarlamudi, J., Morgan, J., Razmara, M., Tamchyna, A., Henry, K., Rudinger, R.: Domain adaptation in machine translation: final report. In: 2012 Johns Hopkins Summer Workshop Final Report. Johns Hopkins University (2012)"},{"key":"15_CR8","unstructured":"Eck, M., Vogel, S., Waibel, A.: Language model adaptation for statistical machine translation based on information retrieval. In: Proceedings of the 4th International Conference on Language Resources and Evaluation, Lisbon, Portugal, May 2004, pp. 327\u2013330. ELRA (2004)"},{"key":"15_CR9","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1007\/978-3-642-40722-2_6","volume-title":"Language Processing and Knowledge in the Web","author":"G Faa\u00df","year":"2013","unstructured":"Faa\u00df, G., Eckart, K.: SdeWaC - a corpus of parsable sentences from the web. In: Biemann, C., Zesch, T., Gurevych, I. (eds.) GSCL 2013. LNCS, vol. 8105, pp. 61\u201368. Springer, Heidelberg (2013)"},{"key":"15_CR10","volume-title":"Data Mining: Concepts and Techniques","author":"J Han","year":"2005","unstructured":"Han, J.: Data Mining: Concepts and Techniques. Morgan Kaufmann Publishers Inc., San Francisco (2005)"},{"key":"15_CR11","unstructured":"Heafield, K.: KenLM: faster and smaller language model queries. In: Proceedings of the Sixth Workshop on Statistical Machine Translation, Edinburgh, Scotland, July 2011, pp. 187\u2013197. ACL (2011)"},{"key":"15_CR12","unstructured":"Hoang, H., Birch, A., Callison-burch, C., Zens, R., Aachen, R., Constantin, A., Federico, M., Bertoldi, N., Dyer, C., Cowan, B., Shen, W., Moran, C., Bojar, O.: Moses: open source toolkit for statistical machine translation. In: ACL, Prague, Czech Republic, June 2007, pp. 177\u2013180. Association for Computational Linguistics (2007)"},{"key":"15_CR13","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1109\/97.611282","volume":"4","author":"R Iyer","year":"1997","unstructured":"Iyer, R., Ostendorf, M., Gish, H.: Using out-of-domain data to improve in-domain language models. IEEE Signal Process. Lett. 4, 221\u2013223 (1997)","journal-title":"IEEE Signal Process. Lett."},{"key":"15_CR14","unstructured":"Jiang, J.: Domain adaptation in natural language processing. University of Illinois at Urbana-Champaign (2008)"},{"issue":"3","key":"15_CR15","doi-asserted-by":"publisher","first-page":"348","DOI":"10.1016\/0953-5438(93)90015-L","volume":"5","author":"J Karlgren","year":"1993","unstructured":"Karlgren, J.: Sublanguages and registers - a note on terminology. Interact. Comput. 5(3), 348\u2013350 (1993)","journal-title":"Interact. Comput."},{"key":"15_CR16","unstructured":"Kay, M.: The proper place of men and machines in language translation. Technical Report CSL-80-11, Xerox Palo Alto Research Center, Palo Alto, California (1980)"},{"volume-title":"Sublanguage: Studies of Language in Restricted Semantic Domains","year":"1982","key":"15_CR17","unstructured":"Kittredge, R., Lehrberger, J. (eds.): Sublanguage: Studies of Language in Restricted Semantic Domains. W. de Gruyter, Berlin, New York (1982)"},{"key":"15_CR18","doi-asserted-by":"crossref","unstructured":"Koehn, P., Hoang, H., Birch, A., Callison-Burch, C., Federico, M., Bertoldi, N., Cowan, B., Shen, W., Moran, C., Zens, R., Dyer, C., Bojar, O., Constantin, A., Herbst, E.: Moses: open source toolkit for statistical machine translation. In: Proceedings of the 45th Annual Meeting of the ACL on Interactive Poster and Demonstration Sessions, ACL 2007, Stroudsburg, PA, USA, pp. 177\u2013180. Association for Computational Linguistics (2007)","DOI":"10.3115\/1557769.1557821"},{"key":"15_CR19","unstructured":"Koehn, P.: Europarl: a parallel corpus for statistical machine translation. In: Conference Proceedings: The Tenth Machine Translation Summit, Phuket, Thailand, pp. 79\u201386. AAMT (2005)"},{"key":"15_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1007\/3-540-61510-5_48","volume-title":"Artificial Neural Networks \u2014 ICANN 96","author":"T Kohonen","year":"1996","unstructured":"Kohonen, T., Kaski, S., Lagus, K., Honkela, T.: Very large two-level SOM for the browsing of newsgroups. In: von der Malsburg, C., von Seelen, W., Vorbr\u00fcggen, J.C., Sendhoff, B. (eds.) Artificial Neural Networks \u2014 ICANN 96. LNCS, vol. 1112, pp. 269\u2013274. Springer, Berlin (1996)"},{"issue":"3","key":"15_CR21","first-page":"574","volume":"11","author":"T Kohonen","year":"2000","unstructured":"Kohonen, T., Kaski, S., Lagus, K., Salojrvi, J., Paatero, V., Saarela, A.: Organization of a massive document collection. IEEE Trans. Neural Netw. Spec. Issue Neural Netw. Data Min. Knowl. Discov. 11(3), 574\u2013585 (2000)","journal-title":"IEEE Trans. Neural Netw. Spec. Issue Neural Netw. Data Min. Knowl. Discov."},{"issue":"1","key":"15_CR22","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1007\/BF00337288","volume":"43","author":"T Kohonen","year":"1982","unstructured":"Kohonen, T.: Self-organized formation of topologically correct feature maps. Biol. Cybern. 43(1), 59\u201369 (1982)","journal-title":"Biol. Cybern."},{"issue":"1\u20133","key":"15_CR23","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1016\/j.ins.2003.03.017","volume":"163","author":"K Lagus","year":"2004","unstructured":"Lagus, K., Kaski, S., Kohonen, T.: Mining massive document collections by the WEBSOM method. Inf. Sci. 163(1\u20133), 135\u2013156 (2004)","journal-title":"Inf. Sci."},{"issue":"8","key":"15_CR24","first-page":"707","volume":"10","author":"VI Levenshtein","year":"1966","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting deletions, insertions and reversals. Sov. Phys. Dokl. 10(8), 707\u2013710 (1966)","journal-title":"Sov. Phys. Dokl."},{"key":"15_CR25","doi-asserted-by":"crossref","unstructured":"Louis, A., Webber, B.: Structured and unstructured cache models for SMT domain adaptation. In: Shuly Wintner, I., Stefan Riezler, G., Sharon Goldwater, U., (eds.) Proceedings of the 14th Conference of the European Chapter of the Association for Computational Linguistics, vol. 2: Short Papers, Gothenburg, Sweden, April 2014. Association for Computational Linguistics (2014)","DOI":"10.3115\/v1\/E14-1017"},{"key":"15_CR26","unstructured":"Lu, Y., Huang, J., Liu, Q.: Improving statistical machine translation performance by training data selection and optimization. In: Proceedings of the 2007 Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP-CoNLL), Prague, Czech Republic, June 2007, pp. 343\u2013350. Association for Computational Linguistics (2007)"},{"key":"15_CR27","doi-asserted-by":"crossref","unstructured":"Mahajan, M., Beeferman, D., Huang, X.D.: Improved topic-dependent language modeling using information retrieval techniques. In: ICASSP (1999)","DOI":"10.1109\/ICASSP.1999.758182"},{"key":"15_CR28","unstructured":"Moore, R.C., Lewis, W.: Intelligent selection of language model training data. In: Proceedings of the 48th Annual Meeting of the Association for Computational Linguistics, volume Short papers, Uppsala, Sweden, July 2010, pp. 220\u2013224. ACL (2010)"},{"issue":"1","key":"15_CR29","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F., Varoquaux, G., Gramfort, A., Michel, V., Thirion, B., Grisel, O., Blondel, M., Prettenhofer, P., Weiss, R., Dubourg, V., Vanderplas, J., Passos, A., Cournapeau, D., Brucher, M., Perrot, M., Duchesnay, \u00c9.: Scikit-learn: machine learning in Python. J. Mach. Learn. Res. 12(1), 2825\u20132830 (2011)","journal-title":"J. Mach. Learn. Res."},{"key":"15_CR30","unstructured":"Plank, B.: Domain adaptation for parsing. Ph.D. thesis, University of Groningen (2011)"},{"key":"15_CR31","doi-asserted-by":"crossref","unstructured":"Price, P.J.: Evaluation of spoken language systems: the ATIS domain. In: Proceedings of the Workshop on Speech and Natural Language, HLT 1990, Stroudsburg, PA, USA, pp. 91\u201395. Association for Computational Linguistics (1990)","DOI":"10.3115\/116580.116612"},{"key":"15_CR32","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1006\/csla.1996.0011","volume":"10","author":"R Rosenfeld","year":"1996","unstructured":"Rosenfeld, R.: A maximum entropy approach to adaptive statistical language modeling. Comput. Speech Lang. 10, 187\u2013228 (1996)","journal-title":"Comput. Speech Lang."},{"key":"15_CR33","doi-asserted-by":"publisher","first-page":"1270","DOI":"10.1109\/5.880083","volume":"88","author":"R Rosenfeld","year":"2000","unstructured":"Rosenfeld, R.: Two decades of statistical language modeling: where do we go from here. Proc. IEEE 88, 1270\u20131278 (2000)","journal-title":"Proc. IEEE"},{"key":"15_CR34","unstructured":"Salvador, S., Chan, P.: Determining the number of clusters\/segments in hierarchical clustering\/segmentation algorithms. In: ICTAI, pp. 576\u2013584. IEEE Computer Society (2004)"},{"key":"15_CR35","unstructured":"Sennrich, R., Schwenk, H., Aransa, W.: A multi-domain translation model framework for statistical machine translation. In: ACL (1), pp. 832\u2013840. The Association for Computer Linguistics (2013)"},{"key":"15_CR36","unstructured":"Sennrich, R.: Combining multi-engine machine translation and online learning through dynamic phrase tables. In: EAMT 2011: The 15th Annual Conference of the European Association for Machine Translation, Leuven, Belgium, May 2011. European Association for Machine Translation (2011)"},{"key":"15_CR37","unstructured":"Tiedemann, J.: Parallel data, tools and interfaces in OPUS. In: Chair, N.C.C., Choukri, K., Declerck, T., Dogan, M.U., Maegaard, B., Mariani, J., Odijk, J., Piperidis, S. (eds.) Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC 2012), Istanbul, Turkey, May 2012. European Language Resources Association (ELRA) (2012)"},{"key":"15_CR38","doi-asserted-by":"crossref","unstructured":"Wang, L., Wong, D.F., Chao, L.S., Lu, Y., Xing, J.: A systematic comparison of data selection criteria for smt domain adaptation. Sc. World J. 2014(1) (2014)","DOI":"10.1155\/2014\/745485"}],"container-title":["Lecture Notes in Computer Science","Modeling and Using Context"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-25591-0_15","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,31]],"date-time":"2025-05-31T19:46:56Z","timestamp":1748720816000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-25591-0_15"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319255903","9783319255910"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-25591-0_15","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2015]]}}}