{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T11:28:05Z","timestamp":1775647685505,"version":"3.50.1"},"reference-count":54,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2012,6,7]],"date-time":"2012-06-07T00:00:00Z","timestamp":1339027200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Mach Learn"],"published-print":{"date-parts":[[2012,9]]},"DOI":"10.1007\/s10994-012-5296-5","type":"journal-article","created":{"date-parts":[[2012,6,6]],"date-time":"2012-06-06T17:00:50Z","timestamp":1339002050000},"page":"399-431","source":"Crossref","is-referenced-by-count":47,"title":["Structured learning with constrained conditional models"],"prefix":"10.1007","volume":"88","author":[{"given":"Ming-Wei","family":"Chang","sequence":"first","affiliation":[]},{"given":"Lev","family":"Ratinov","sequence":"additional","affiliation":[]},{"given":"Dan","family":"Roth","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,6,7]]},"reference":[{"key":"5296_CR1","volume-title":"Proceedings of HLT\/NAACL","author":"R. Barzilay","year":"2006","unstructured":"Barzilay, R., & Lapata, M. (2006). Aggregation via set partitioning for natural language generation. In Proceedings of HLT\/NAACL, June 2006."},{"key":"5296_CR2","volume-title":"Proceedings of uncertainty in artificial intelligence (UAI)","author":"K. Bellare","year":"2009","unstructured":"Bellare, K., Druck, G., & McCallum, A. (2009). Alternating projections for learning with expectation constraints. In Proceedings of uncertainty in artificial intelligence (UAI)."},{"key":"5296_CR3","first-page":"92","volume-title":"Proceedings of the annual ACM workshop on computational learning theory (COLT)","author":"A. Blum","year":"1998","unstructured":"Blum, A., & Mitchell, T. (1998). Combining labeled and unlabeled data with co-training. In Proceedings of the annual ACM workshop on computational learning theory (COLT) (pp. 92\u2013100)."},{"key":"5296_CR4","unstructured":"Borman, S. (2004). The expectation maximization algorithm\u2014a\u00a0short tutorial. Introduces the Expectation Maximization (EM) algorithm and fleshes out the basic mathematical results, including a proof of convergence. The Generalized EM algorithm is also introduced, July 2004."},{"key":"5296_CR5","volume-title":"Proceedings of the third ACM international conference on web search and data mining","author":"A. Carlson","year":"2010","unstructured":"Carlson, A., Betteridge, J., Wang, R. C., Hruschka, E. R. Jr., & Mitchell, T. M. (2010). Coupled semi-supervised learning for information extraction. In Proceedings of the third ACM international conference on web search and data mining."},{"key":"5296_CR6","first-page":"280","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"M. Chang","year":"2007","unstructured":"Chang, M., Ratinov, L., & Roth, D. (2007). Guiding semi-supervision with constraint-driven learning. In Proceedings of the annual meeting of the association for computational linguistics (ACL), Prague, Czech Republic, June 2007 (pp. 280\u2013287). New York: Association for Computational Linguistics."},{"key":"5296_CR7","first-page":"173","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"E. Charniak","year":"2005","unstructured":"Charniak, E., & Johnson, M. (2005). Coarse-to-fine n-best parsing and maxent discriminative reranking. In Proceedings of the annual meeting of the association for computational linguistics (ACL), Ann Arbor, Michigan (pp. 173\u2013180). New York: ACL."},{"key":"5296_CR8","first-page":"144","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"J. Clarke","year":"2006","unstructured":"Clarke, J., & Lapata, M. (2006). Constraint-based sentence compression: an integer programming approach. In Proceedings of the annual meeting of the association for computational linguistics (ACL), Sydney, Australia, July 2006 (pp. 144\u2013151). New York: ACL."},{"key":"5296_CR9","first-page":"89","volume-title":"Proceedings of international conference on knowledge discovery and data mining (KDD)","author":"W. Cohen","year":"2004","unstructured":"Cohen, W. (2004). Exploiting dictionaries in named entity extraction: combining semi-Markov extraction processes and data integration methods. In Proceedings of international conference on knowledge discovery and data mining (KDD) (pp. 89\u201398)."},{"key":"5296_CR10","first-page":"175","volume-title":"Proceedings of the 17th international conference on machine learning","author":"M. Collins","year":"2000","unstructured":"Collins, M. (2000). Discriminative reranking for natural language parsing. In Proceedings of the 17th international conference on machine learning (pp. 175\u2013182). San Francisco: Morgan Kaufmann."},{"key":"5296_CR11","volume-title":"Proceedings of the conference on empirical methods for natural language processing (EMNLP)","author":"M. Collins","year":"2002","unstructured":"Collins, M. (2002). Discriminative training methods for hidden Markov models: theory and experiments with perceptron algorithms. In Proceedings of the conference on empirical methods for natural language processing (EMNLP)."},{"key":"5296_CR12","volume-title":"Proceedings of the conference on empirical methods for natural language processing (EMNLP)","author":"M. Collins","year":"1999","unstructured":"Collins, M., & Singer, Y. (1999). Unsupervised models for named entity classification. In Proceedings of the conference on empirical methods for natural language processing (EMNLP)."},{"key":"5296_CR13","doi-asserted-by":"crossref","first-page":"837","DOI":"10.1145\/1645953.1646059","volume-title":"Proceedings of ACM conference on information and knowledge management (CIKM)","author":"K. Collins-Thompson","year":"2009","unstructured":"Collins-Thompson, K. (2009). Reducing the risk of query expansion via robust constrained optimization. In Proceedings of ACM conference on information and knowledge management (CIKM) (pp. 837\u2013846)."},{"key":"5296_CR14","first-page":"99","volume-title":"Proceedings of the international conference on machine learning (ICML)","author":"F. G. Cozman","year":"2003","unstructured":"Cozman, F. G., Cohen, I., & Cirelo, M. C. (2003). Semi-supervised learning of mixture models. In Proceedings of the international conference on machine learning (ICML) (pp. 99\u2013106)."},{"key":"5296_CR15","volume-title":"Proceedings of the international conference on machine learning (ICML)","author":"H. Daum\u00e9","year":"2005","unstructured":"Daum\u00e9, H., & Marcu, D. (2005). Learning as search optimization: approximate large margin methods for structured prediction. In Proceedings of the international conference on machine learning (ICML), Bonn, Germany, 2005."},{"key":"5296_CR16","first-page":"120","volume-title":"Proceedings of AUAI","author":"R. Dechter","year":"2004","unstructured":"Dechter, R., & Mateescu, R. (2004). Mixtures of deterministic-probabilistic networks and their AND\/OR search space. In Proceedings of AUAI, Arlington, VA, USA, 2004 (pp. 120\u2013129). New York: AUAI Press."},{"key":"5296_CR17","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1111\/j.2517-6161.1977.tb01600.x","volume":"39","author":"A. P. Dempster","year":"1977","unstructured":"Dempster, A. P., Laird, N. M., & Rubin, D. B. (1977). Maximum likelihood from incomplete data via the EM algorithm. Journal of the Royal Statistical Society, 39, 1\u201338.","journal-title":"Journal of the Royal Statistical Society"},{"key":"5296_CR18","volume-title":"Proceedings of the annual meeting of the North American association of computational linguistics (NAACL)","author":"P. Denis","year":"2007","unstructured":"Denis, P., & Baldridge, J. (2007). Joint determination of anaphoricity and coreference resolution using integer programming. In Proceedings of the annual meeting of the North American association of computational linguistics (NAACL)."},{"key":"5296_CR19","first-page":"363","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"J. R. Finkel","year":"2005","unstructured":"Finkel, J. R., Grenager, T., & Manning, C. (2005). Incorporating non-local information into information extraction systems by Gibbs sampling. In Proceedings of the annual meeting of the association for computational linguistics (ACL), Morristown, NJ, USA, 2005 (pp. 363\u2013370). New York: Association for Computational Linguistics."},{"key":"5296_CR20","first-page":"1300","volume-title":"Proceedings of the international joint conference on artificial intelligence (IJCAI)","author":"N. Friedman","year":"1999","unstructured":"Friedman, N., Getoor, L., Koller, D., & Pfeffer, A. (1999). Learning probabilistic relational models. In Proceedings of the international joint conference on artificial intelligence (IJCAI) (pp. 1300\u20131309)."},{"key":"5296_CR21","unstructured":"Ganchev, K., Gra\u00e7a, J., Gillenwater, J., & Taskar, B. (2010). Posterior regularization for structured latent variable models. Journal of Machine Learning Research."},{"key":"5296_CR22","volume-title":"NIPS","author":"J. V. Graca","year":"2007","unstructured":"Graca, J. V., Ganchev, K., & Taskar, B. (2007). Expectation maximization and posterior constraints. In NIPS (Vol.\u00a020)."},{"key":"5296_CR23","volume-title":"Proceedings of the annual meeting of the association for computational linguistics","author":"T. Grenager","year":"2005","unstructured":"Grenager, T., Klein, D., & Manning, C. (2005). Unsupervised learning of field segmentation models for information extraction. In Proceedings of the annual meeting of the association for computational linguistics. New York: ACL."},{"key":"5296_CR24","volume-title":"Proceedings of HTL-NAACL","author":"A. Haghighi","year":"2006","unstructured":"Haghighi, A., & Klein, D. (2006). Prototype-driven learning for sequence models. In Proceedings of HTL-NAACL."},{"key":"5296_CR25","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1049\/cp:19991075","volume-title":"Proceedings of the 9th international conference on artificial neural networks (ICANN99)","author":"G. Hinton","year":"1999","unstructured":"Hinton, G. (1999). Products of experts. In Proceedings of the 9th international conference on artificial neural networks (ICANN99) (pp. 1\u20136)."},{"key":"5296_CR26","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"L. Huang","year":"2008","unstructured":"Huang, L. (2008). Forest reranking: discriminative parsing with non-local features. In Proceedings of the annual meeting of the association for computational linguistics (ACL)."},{"key":"5296_CR27","first-page":"266","volume-title":"Proceedings of the 13th conference on uncertainty in artificial intelligence","author":"M. Jaeger","year":"1997","unstructured":"Jaeger, M. (1997). Relational Bayesian networks. In M. Kaufmann (Ed.), Proceedings of the 13th conference on uncertainty in artificial intelligence (pp. 266\u2013273)."},{"key":"5296_CR28","first-page":"315","volume-title":"Proceedings of the 2007 joint conference of EMNLP-CoNLL","author":"J. Kazama","year":"2007","unstructured":"Kazama, J., & Torisawa, K. (2007). A\u00a0new perceptron algorithm for sequence labeling with non-local features. In Proceedings of the 2007 joint conference of EMNLP-CoNLL (pp. 315\u2013324)."},{"key":"5296_CR29","first-page":"138","volume-title":"Proceedings of the work-in-progress track at the 10th international conference on inductive logic programming","author":"K. Kersting","year":"2000","unstructured":"Kersting, K., & Raedt, L. D. (2000). Bayesian logic programs. In J. Cussens & A. Frisch (Eds.), Proceedings of the work-in-progress track at the 10th international conference on inductive logic programming (pp.\u00a0138\u2013155)."},{"key":"5296_CR30","volume-title":"Proceedings of the international conference on machine learning (ICML)","author":"J. Lafferty","year":"2001","unstructured":"Lafferty, J., McCallum, A., & Pereira, F. (2001). Conditional random fields: probabilistic models for segmenting and labeling sequence data. In Proceedings of the international conference on machine learning (ICML)."},{"key":"5296_CR31","volume-title":"Proceedings of the international conference on machine learning (ICML)","author":"P. Liang","year":"2009","unstructured":"Liang, P., Jordan, M. I., & Klein, D. (2009). Learning from measurements in exponential families. In Proceedings of the international conference on machine learning (ICML)."},{"key":"5296_CR32","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"P. Liang","year":"2008","unstructured":"Liang, P., & Klein, D. (2008). Analyzing the errors of unsupervised learning. In Proceedings of the annual meeting of the association for computational linguistics (ACL)."},{"key":"5296_CR33","first-page":"870","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"G. Mann","year":"2008","unstructured":"Mann, G., & McCallum, A. (2008). Generalized expectation criteria for semi-supervised learning of conditional random fields. In Proceedings of the annual meeting of the association for computational linguistics (ACL) (pp. 870\u2013878)."},{"key":"5296_CR34","doi-asserted-by":"crossref","first-page":"136","DOI":"10.3115\/1706543.1706568","volume-title":"Proceedings of the annual conference on computational natural language learning (CoNLL)","author":"T. Marciniak","year":"2005","unstructured":"Marciniak, T., & Strube, M. (2005). Beyond the pipeline: discrete optimization in NLP. In Proceedings of the annual conference on computational natural language learning (CoNLL), Ann Arbor, MI, June 2005 (pp. 136\u2013143). New York: Association for Computational Linguistics."},{"key":"5296_CR35","volume-title":"Proceedings of the international conference on machine learning (ICML)","author":"A. McCallum","year":"2000","unstructured":"McCallum, A., Freitag, D., & Pereira, F. (2000). Maximum entropy Markov models for information extraction and segmentation. In Proceedings of the international conference on machine learning (ICML)."},{"key":"5296_CR36","volume-title":"Proceedings of the international conference on acoustics, speech, and signal processing","author":"B. Merialdo","year":"1991","unstructured":"Merialdo, B. (1991). Tagging text with a probabilistic model. In Proceedings of the international conference on acoustics, speech, and signal processing."},{"key":"5296_CR37","first-page":"841","volume-title":"The conference on advances in neural information processing systems (NIPS)","author":"A. Y. Ng","year":"2001","unstructured":"Ng, A. Y., & Jordan, M. I. (2001). On discriminative vs. generative classifiers: a\u00a0comparison of logistic regression and naive Bayes. In The conference on advances in neural information processing systems (NIPS) (pp. 841\u2013848)."},{"key":"5296_CR38","first-page":"286","volume-title":"Asian computing science conference","author":"L. Ngo","year":"1995","unstructured":"Ngo, L., & Haddawy, P. (1995). Probabilistic logic programming and Bayesian networks. In Asian computing science conference (pp. 286\u2013300)."},{"issue":"2\/3","key":"5296_CR39","doi-asserted-by":"crossref","first-page":"103","DOI":"10.1023\/A:1007692713085","volume":"39","author":"K. Nigam","year":"2000","unstructured":"Nigam, K., Mccallum, A., Thrun, S., & Mitchell, T. (2000). Text classification from labeled and unlabeled documents using EM. Machine Learning, 39(2\/3), 103\u2013134.","journal-title":"Machine Learning"},{"key":"5296_CR40","first-page":"1117","volume-title":"Proceedings of the international joint conference on artificial intelligence (IJCAI)","author":"V. Punyakanok","year":"2005","unstructured":"Punyakanok, V., Roth, D., & Yih, W. (2005a). The necessity of syntactic parsing for semantic role labeling. In Proceedings of the international joint conference on artificial intelligence (IJCAI) (pp. 1117\u20131123)."},{"key":"5296_CR41","first-page":"1124","volume-title":"Proceedings of the international joint conference on artificial intelligence (IJCAI)","author":"V. Punyakanok","year":"2005","unstructured":"Punyakanok, V., Roth, D., Yih, W., & Zimak, D. (2005b). Learning and inference over constrained output. In Proceedings of the international joint conference on artificial intelligence (IJCAI) (pp. 1124\u20131129)."},{"issue":"2","key":"5296_CR42","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1162\/coli.2008.34.2.257","volume":"34","author":"V. Punyakanok","year":"2008","unstructured":"Punyakanok, V., Roth, D., & Yih, W. (2008). The importance of syntactic parsing and inference in semantic role labeling. Computational Linguistics, 34(2), 257\u2013287.","journal-title":"Computational Linguistics"},{"issue":"1","key":"5296_CR43","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1109\/MASSP.1986.1165342","volume":"3","author":"L. R. Rabiner","year":"1986","unstructured":"Rabiner, L. R., & Juang, B. H. (1986). An introduction to hidden Markov models. IEEE ASSP Magazine, 3(1), 4\u201316.","journal-title":"IEEE ASSP Magazine"},{"issue":"1\u20132","key":"5296_CR44","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1007\/s10994-006-5833-1","volume":"62","author":"M. Richardson","year":"2006","unstructured":"Richardson, M., & Domingos, P. (2006). Markov logic networks. Machine Learning Journal, 62(1\u20132), 107\u2013136.","journal-title":"Machine Learning Journal"},{"key":"5296_CR45","doi-asserted-by":"crossref","first-page":"597","DOI":"10.1109\/ICSC.2007.53","volume-title":"Proceedings of the first international conference on semantic computing (ICSC)","author":"N. Rizzolo","year":"2007","unstructured":"Rizzolo, N., & Roth, D. (2007). Modeling Discriminative Global Inference. In Proceedings of the first international conference on semantic computing (ICSC), Irvine, CA, September 2007 (pp. 597\u2013604). New York: IEEE."},{"key":"5296_CR46","first-page":"898","volume-title":"Proceedings of the international joint conference on artificial intelligence (IJCAI)","author":"D. Roth","year":"1999","unstructured":"Roth, D. (1999). Learning in natural language. In Proceedings of the international joint conference on artificial intelligence (IJCAI) (pp. 898\u2013904)."},{"key":"5296_CR47","first-page":"1","volume-title":"Proceedings of the annual conference on computational natural language learning (CoNLL)","author":"D. Roth","year":"2004","unstructured":"Roth, D., & Yih, W. (2004). A\u00a0linear programming formulation for global inference in natural language tasks. In H. T. Ng & E. Riloff (Eds.), Proceedings of the annual conference on computational natural language learning (CoNLL) (pp. 1\u20138). New York: Association for Computational Linguistics."},{"key":"5296_CR48","first-page":"737","volume-title":"Proceedings of the international conference on machine learning (ICML)","author":"D. Roth","year":"2005","unstructured":"Roth, D., & Yih, W. (2005). Integer linear programming inference for conditional random fields. In Proceedings of the international conference on machine learning (ICML) (pp. 737\u2013744)."},{"key":"5296_CR49","volume-title":"Introduction to statistical relational learning","author":"D. Roth","year":"2007","unstructured":"Roth, D., & Yih, W. (2007). Global inference for entity and relation identification via a linear programming formulation. In L. Getoor & B. Taskar (Eds.), Introduction to statistical relational learning. Cambridge: MIT Press."},{"key":"5296_CR50","first-page":"1185","volume-title":"The conference on advances in neural information processing systems (NIPS)","author":"S. Sarawagi","year":"2004","unstructured":"Sarawagi, S., & Cohen, W. (2004). Semi-Markov conditional random fields for information extraction. In The conference on advances in neural information processing systems (NIPS) (pp. 1185\u20131192)."},{"key":"5296_CR51","volume-title":"Proceedings of the conference on empirical methods for natural language processing (EMNLP)","author":"M. Thelen","year":"2002","unstructured":"Thelen, M., & Riloff, E. (2002). A\u00a0bootstrapping method for learning semantic lexicons using extraction pattern contexts. In Proceedings of the conference on empirical methods for natural language processing (EMNLP)."},{"key":"5296_CR52","volume-title":"Proceedings of ACL 2005","author":"K. Toutanova","year":"2005","unstructured":"Toutanova, K., Haghighi, A., & Manning, C. D. (2005). Joint learning improves semantic role labeling. In Proceedings of ACL 2005."},{"key":"5296_CR53","volume-title":"Proceedings of the annual meeting of the association for computational linguistics (ACL)","author":"D. Yarowsky","year":"1995","unstructured":"Yarowsky, D. (1995). Unsupervised word sense disambiguation rivaling supervied methods. In Proceedings of the annual meeting of the association for computational linguistics (ACL)."},{"key":"5296_CR54","volume-title":"Semi-supervised learning literature survey","author":"X. Zhu","year":"2006","unstructured":"Zhu, X. (2006). Semi-supervised learning literature survey."}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-012-5296-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10994-012-5296-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-012-5296-5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,25]],"date-time":"2024-04-25T00:54:05Z","timestamp":1714006445000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10994-012-5296-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,6,7]]},"references-count":54,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2012,9]]}},"alternative-id":["5296"],"URL":"https:\/\/doi.org\/10.1007\/s10994-012-5296-5","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"value":"0885-6125","type":"print"},{"value":"1573-0565","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,6,7]]}}}