{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,23]],"date-time":"2025-01-23T05:29:18Z","timestamp":1737610158013,"version":"3.33.0"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2007,10,1]],"date-time":"2007-10-01T00:00:00Z","timestamp":1191196800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Front. Comput. Sc. China"],"published-print":{"date-parts":[[2007,10]]},"DOI":"10.1007\/s11704-007-0040-1","type":"journal-article","created":{"date-parts":[[2007,11,19]],"date-time":"2007-11-19T20:45:05Z","timestamp":1195505105000},"page":"413-428","source":"Crossref","is-referenced-by-count":3,"title":["Recent advances on NLP research in Harbin Institute of Technology"],"prefix":"10.1007","volume":"1","author":[{"given":"Tiejun","family":"Zhao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yi","family":"Guan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ting","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qiang","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"issue":"1","key":"40_CR1","first-page":"50","volume":"13","author":"M. Zhang","year":"1994","unstructured":"Zhang M, Li S, Zhao T J, et al. Research on CEMT-III machine translation system from Chinese to English. Journal of the China Society for Scientific and Technical Information, 1994, 13(1): 50\u201363","journal-title":"Journal of the China Society for Scientific and Technical Information"},{"issue":"2","key":"40_CR2","first-page":"99","volume":"18","author":"E. D. Xun","year":"1999","unstructured":"Xun E D, Zhao T J. The selection method of translated text in BT863-II English-Chinese machine translation system. Journal of the China Society for Scientific and Technical Information, 1999, 18(2): 99\u2013104","journal-title":"Journal of the China Society for Scientific and Technical Information"},{"issue":"1","key":"40_CR3","first-page":"137","volume":"30","author":"W. Jiang","year":"2007","unstructured":"Jiang W, Wang X L, Guan Y, et al. Research on Chinese lexical analysis by fusing multiple knowledge sources. Chinese Journal of Computer, 2007, 30(1): 137\u2013145","journal-title":"Chinese Journal of Computer"},{"issue":"1","key":"40_CR4","first-page":"94","volume":"13","author":"W. Jiang","year":"2006","unstructured":"Jiang W, Wang X L, Guan Y, et al. Applying rough sets in word segmentation disambiguation based on maximum entropy model. Journal of Harbin Institute of Technology (New Series), 2006, 13(1): 94\u201398","journal-title":"Journal of Harbin Institute of Technology (New Series)"},{"issue":"4","key":"40_CR5","first-page":"393","volume":"11","author":"W. Jiang","year":"2006","unstructured":"Jiang W, Guan Y, Wang X L. A pragmatic Chinese word segmentation approach based on mixing models. International Journal of Computational Linguistics and Chinese Language Processing, 2006, 11(4): 393\u2013416","journal-title":"International Journal of Computational Linguistics and Chinese Language Processing"},{"key":"40_CR6","doi-asserted-by":"crossref","first-page":"2630","DOI":"10.1109\/ICMLC.2006.258916","volume":"4","author":"W. Jiang","year":"2006","unstructured":"Jiang W, Guan Y, Wang X L. Improving feature extraction in named entity recognition based on maximum entropy model. In: The 2006 International Conference on Machine Learning and Cybernetics. Dalian, 2006, 4: 2630\u20132635","journal-title":"The 2006 International Conference on Machine Learning and Cybernetics. Dalian"},{"key":"40_CR7","first-page":"667","volume":"4114","author":"W. Jiang","year":"2006","unstructured":"Jiang W, Guan Y, Wang X L. Conditional random fields based label sequence and information feedback. Lecture Notes in Artificial Intelligence, 2006, 4114: 667\u2013689","journal-title":"Lecture Notes in Artificial Intelligence"},{"key":"40_CR8","unstructured":"Sun H L, Yu S W. The survey of shallow parsing. The present linguistics, 2000, 63\u201373"},{"key":"40_CR9","unstructured":"Sang T K. Introduction to the CoNLL-2000 shared task: chunking. In: Proceedings of CoNLL-2000 and LLL-2000 conference. Lisbon, 2000, 127\u2013132"},{"key":"40_CR10","volume-title":"Dissertation for the Doctoral Degree","author":"Y. H. Liang","year":"2006","unstructured":"Liang Y H. Research on the technology of English and Chinese text chunking based on multi-agent strategy. Dissertation for the Doctoral Degree. Harbin: HIT, 2006"},{"key":"40_CR11","doi-asserted-by":"crossref","unstructured":"Liang Y H, Zhao T J. Distributed English text chunking using multi-agent based architecture. In: Proceedings of Mexican International Conference on Artificial Intelligence. Mexican, 2005, 752\u2013760","DOI":"10.1007\/11579427_76"},{"key":"40_CR12","volume-title":"Dissertation for the Doctoral Degree","author":"H. L. Cao","year":"2006","unstructured":"Cao H L. Research on Chinese syntactic parsing based on lexicalized statistical model. Dissertation for the Doctoral Degree. Harbin: HIT, 2006"},{"key":"40_CR13","volume-title":"Dissertation for the Doctoral Degree","author":"X. W. Han","year":"2006","unstructured":"Han X W. Research on automatic acquisition of Chinese verb subcategorization. Dissertation for the Doctoral Degree. Harbin: HIT, 2006"},{"key":"40_CR14","unstructured":"Cunningham H, Maynard D, Bontcheva K, et al. Gate: a frame-work and graphical development environment for robust NLP tools and applications. In: Proceedings of the 40th Anniversary Meeting of the Association for Computational Linguistics. Philadelphia, 2002, 168\u2013175"},{"key":"40_CR15","first-page":"214","volume-title":"Proceedings of the ACL demonstration session","author":"B. Steven","year":"2004","unstructured":"Steven B, Edward L. NLTK: the natural language toolkit. In: Proceedings of the ACL demonstration session. Barcelona: Association for Computational Linguistics, 2004, 214\u2013217"},{"key":"40_CR16","first-page":"252","volume-title":"Proceedings of the 33rd annual meeting on Association for Computational Linguistics","author":"K. Kevin","year":"1995","unstructured":"Kevin K, Hatzivassiloglou V. Two-level, many-paths generation. In: Proceedings of the 33rd annual meeting on Association for Computational Linguistics. Cambridge: Association for Computational Linguistics, 1995, 252\u2013260"},{"key":"40_CR17","unstructured":"Zhang H P, Liu T, Ma J S, et al. Chinese word segmentation with multiple postprocessors in HIT-IRLab. SIGHAN, 2005, 172\u2013175"},{"key":"40_CR18","unstructured":"Liao X T, Yu H B, Qin B, et al. Named entity recognition with the method of combining HMM with rules. In: Proceedings of Student Workshop of Computational Linguistics. Shen Yang, 2006 (in Chinese)"},{"key":"40_CR19","unstructured":"Lu Z M, Liu T, Zhang G, et al. Word sense disambiguation based on dependency relation ship analysis and Bayes model. Chinese High Technology Letters, 2003, (5): 1\u20137 (in Chinese)"},{"key":"40_CR20","unstructured":"Ma J S, Zhang Y, Liu T, et al. A statistical dependency parser of Chinese under small training data. In: The 1st International Joint Conference of Natural Language Processing, 2004"},{"key":"40_CR21","unstructured":"Liu H J, Che W X, Liu T. Feature engineering for Chinese semantic role labeling. In: Proceedings of Student Workshop of Computational Linguistics. Shen Yang, 2006, 75\u201380 (in Chinese)"},{"issue":"3","key":"40_CR22","first-page":"361","volume":"5","author":"D. D. Lewis","year":"2004","unstructured":"Lewis D D, Li F, Rose T, et al. RCV1: a new benchmark collection for text categorization research. Journal of Machine Learning Research, 2004, 5(3): 361\u2013397","journal-title":"Journal of Machine Learning Research"},{"key":"40_CR23","doi-asserted-by":"crossref","unstructured":"Ana C C, Arlindo L O. An empirical comparison of text categorization methods. In: Proceedings of the 10th International Symposium on String Processing and Information Retrieval. Manaus, 2003, 183\u2013196","DOI":"10.1007\/978-3-540-39984-1_14"},{"issue":"1","key":"40_CR24","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F. Sebastiani","year":"2002","unstructured":"Fabrizio Sebastiani. Machine learning in automated text categorization. ACM Computing Surveys, 2002, 34(1): 1\u201347","journal-title":"ACM Computing Surveys"},{"issue":"9","key":"40_CR25","doi-asserted-by":"crossref","first-page":"1848","DOI":"10.1360\/jos171848","volume":"17","author":"J. S. Su","year":"2006","unstructured":"Su J S, Zhang B F, Xu X. Advances in machine learning based text categorization. Journal of Software, 2006, 17(9): 1848\u20131859","journal-title":"Journal of Software"},{"issue":"1","key":"40_CR26","first-page":"113","volume":"6","author":"Q. Wang","year":"2006","unstructured":"Wang Q, Guan Y, Wang X L, et al. A novel feature selection method based on category information analysis for class prejudging in text classification. International Journal of Computer Science and Network Security, 2006, 6(1): 113\u2013119","journal-title":"International Journal of Computer Science and Network Security"},{"key":"40_CR27","first-page":"606","volume-title":"Lecture Notes in Artificial Intelligence (IJCNLP04)","author":"Q. Wang","year":"2005","unstructured":"Wang Q, Wang X L, Guan Y. A study of semi-discrete matrix decomposition for LSI in automated text categorization. In: Lecture Notes in Artificial Intelligence (IJCNLP04). Berlin: Springer Verlag, 2005, 3248: 606\u2013615"},{"key":"40_CR28","unstructured":"Wang Q, Wang X L Guan Y, et al. A research on text categorization based on the fusion of K-NN and SVM. Chinese High Technology Letters, 2005, (5): 19\u201324"},{"key":"40_CR29","unstructured":"Wang Q, Guan Y, Wang X L. A method for eliminating class noise in text classification based on feature class attribute. ACTA Automatica Sinica (in press)"},{"issue":"3","key":"40_CR30","first-page":"145","volume":"16","author":"Q. Wang","year":"2006","unstructured":"Wang Q, Guan Y, Wang X L. Explore efficient feature inference and compensation in text classification. Journal of Chinese Language and Computing, 2006, 16(3): 145\u2013156","journal-title":"Journal of Chinese Language and Computing"},{"key":"40_CR31","doi-asserted-by":"crossref","unstructured":"Wang Q, Guan Y, Wang X. SVM-based spam filter with active and online learning. In: Proceedings of the Fifteenth Text Retrieval Conference (TREC 2006). Gaithersburg, 2006","DOI":"10.6028\/NIST.SP.500-272.spam-harbin.zhao"},{"key":"40_CR32","unstructured":"Guan Y, Wang X L, Wang Q. Measurement of system similarity. In: Proceeding of JSCL-2005. Nanjing, 2005"},{"issue":"4","key":"40_CR33","first-page":"1581","volume":"3","author":"C. J. Sun","year":"2007","unstructured":"Sun C J, Guan Y, Wang X L, et al. Insuntourqa: a restricted-domain question answering system. Journal of Computational Information Systems, 2007, 3(4): 1581\u20131590","journal-title":"Journal of Computational Information Systems"},{"key":"40_CR34","doi-asserted-by":"crossref","unstructured":"Zhao Y M, Xu Z M, Guan Y, et al. An open domain question answering system based on improved system similarity model. In: Proceedings of ICMLC 2006. Dalian, 2006, 4521\u20134526","DOI":"10.1109\/ICMLC.2006.259170"},{"key":"40_CR35","doi-asserted-by":"crossref","unstructured":"Zhao Y M, Xu Z M, Guan Y, et al. Insun05QA on QA track of TREC2005. In: Proceeding of the Text REtrieval Conference 2005. Gettysburg, 2005","DOI":"10.6028\/NIST.SP.500-266.qa-hit.zhao"},{"key":"40_CR36","doi-asserted-by":"crossref","unstructured":"Zhao Y M, Xu Z M, Li P, et al. InsunQA06 on QA track of TREC2006. In: Proceeding of the Text REtrieval Conference 2006. Gettysburg, 2006","DOI":"10.6028\/NIST.SP.500-272.qa-harbin.zhao"},{"key":"40_CR37","unstructured":"Li P, Wang X L, Guan Y, et al. Extracting answers to natural language questions from large-scale corpus. In: Proceedings of 2005 IEEE International Conference on Natural Language Processing and Knowledge Engineering. Wuhan, 2005, 690\u2013694"},{"issue":"3","key":"40_CR38","first-page":"189","volume":"6","author":"P. Li","year":"2006","unstructured":"Li P, Wang X L, Guan Y, et al. Answer extraction based on system similarity model and stratified sampling logistic regression in rare date. International Journal of Computer Science and Network Security, 2006, 6(3): 189\u2013196","journal-title":"International Journal of Computer Science and Network Security"},{"key":"40_CR39","volume-title":"TongYiCi CiLin","author":"J. J. Mei","year":"1996","unstructured":"Mei J J. TongYiCi CiLin. Shanghai: Shanghai Cishu Publication Company, 1996"},{"key":"40_CR40","unstructured":"Dong Z D, Dong Q, Hownet. http:\/\/www.keenage.com"},{"key":"40_CR41","doi-asserted-by":"crossref","first-page":"64","DOI":"10.3115\/1626355.1626364","volume-title":"Proceedings of the Second Workshop on Statistical Machine Translation","author":"J. D. Sun","year":"2007","unstructured":"Sun J D, Zhao T J, Liang H S. Meta-structure transformation model for statistical machine translation. In: Proceedings of the Second Workshop on Statistical Machine Translation. Prague: Association for Computational Linguistics, 2007, 64\u201371"},{"key":"40_CR42","unstructured":"Xue Y Z, Li S, Zhao T J, et al. Syntax-based reordering model for phrasal statistical machine translation. Journal on Communications (to appear)"},{"key":"40_CR43","first-page":"487","volume-title":"Proceedings of the Annual Conference on Computer Graphics","author":"B. Coyne","year":"2001","unstructured":"Coyne B, Sproat R. WordsEye: An automatic text-to-scene conversion system. In: Proceedings of the Annual Conference on Computer Graphics. Los Angeles: ACM Press, 2001, 487\u2013496"},{"key":"40_CR44","unstructured":"Carsim. http:\/\/nlp.cs.lth.se\/carsim\/run\/webstart\/complete 2006"},{"key":"40_CR45","unstructured":"Anim N L. http:\/\/www.cis.upenn.edu\/:_cliff-group\/94\/animnl.html , 2007"},{"issue":"3","key":"40_CR46","first-page":"321","volume":"28","author":"R. Q. Lu","year":"2002","unstructured":"Lu R Q, Zhang S M. From story to animation: full life cycle computer aided animation generation. ACTA Automatica Sinica, 2002, 28(3): 321\u2013348","journal-title":"ACTA Automatica Sinica"},{"key":"40_CR47","doi-asserted-by":"crossref","unstructured":"Li H J, Zhao T J, Li S, et al. The extraction of spatial relationships from texts based on hybrid method. In: Proceedings of 2006 IEEE International Conference on Information Acquisition. Weihai, 2006","DOI":"10.1109\/ICIA.2006.306011"},{"key":"40_CR48","unstructured":"Li H J, Zhao T J, Li S. Graphic retrieval based on limited semantics. In: The IEEE International Conference on Natural Language Processing and Knowledge Engineering. Wuhan, 2005, 535\u2013539"},{"key":"40_CR49","unstructured":"Liu N S. Expression of the spatial relationship of objects in Chinese. Chinese Language, 1994, (3): 169\u2013179"},{"key":"40_CR50","unstructured":"Li H J, Zhao T J, Zhao J Y. The extraction of the trajectory from text based on linear classfication. In: The 16th Nordic Conference of Computational Linguistics. Tartu, Estonia, 2007"}],"container-title":["Frontiers of Computer Science in China"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11704-007-0040-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11704-007-0040-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11704-007-0040-1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,22]],"date-time":"2025-01-22T17:48:22Z","timestamp":1737568102000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11704-007-0040-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2007,10]]},"references-count":50,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2007,10]]}},"alternative-id":["40"],"URL":"https:\/\/doi.org\/10.1007\/s11704-007-0040-1","relation":{},"ISSN":["1673-7350","1673-7466"],"issn-type":[{"type":"print","value":"1673-7350"},{"type":"electronic","value":"1673-7466"}],"subject":[],"published":{"date-parts":[[2007,10]]}}}