{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T15:35:55Z","timestamp":1725550555516},"publisher-location":"Berlin, Heidelberg","reference-count":106,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540292425"},{"type":"electronic","value":"9783540316961"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2005]]},"DOI":"10.1007\/11564089_5","type":"book-chapter","created":{"date-parts":[[2005,10,10]],"date-time":"2005-10-10T13:51:09Z","timestamp":1128952269000},"page":"13-44","source":"Crossref","is-referenced-by-count":7,"title":["Algorithms and Software for Collaborative Discovery from Autonomous, Semantically Heterogeneous, Distributed Information Sources"],"prefix":"10.1007","author":[{"given":"Doina","family":"Caragea","sequence":"first","affiliation":[]},{"given":"Jun","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Jie","family":"Bao","sequence":"additional","affiliation":[]},{"given":"Jyotishman","family":"Pathak","sequence":"additional","affiliation":[]},{"given":"Vasant","family":"Honavar","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"5_CR1","volume-title":"Machine Learning","author":"T. Mitchell","year":"1997","unstructured":"Mitchell, T.: Machine Learning. McGraw Hill, New York (1997)"},{"key":"5_CR2","volume-title":"Pattern Recognition","author":"R. Duda","year":"2000","unstructured":"Duda, R., Hart, E., Stork, D.: Pattern Recognition. Wiley, Chichester (2000)"},{"key":"5_CR3","unstructured":"Thrun, S., Faloutsos, C., Mitchell, M., Wasserman, L.: Automated learning and discovery: State-of-the-art and research topics in a rapidly growing field. AI Magazine (1999)"},{"key":"5_CR4","doi-asserted-by":"crossref","DOI":"10.1007\/978-0-387-21606-5","volume-title":"The Elements of Statistical Learning : Data Mining, Inference, and Prediction","author":"T. Hastie","year":"2001","unstructured":"Hastie, T., Tibshirani, R., Friedman, J.: The Elements of Statistical Learning: Data Mining, Inference, and Prediction. Springer, Heidelberg (2001)"},{"key":"5_CR5","doi-asserted-by":"crossref","DOI":"10.1093\/oso\/9780198538493.001.0001","volume-title":"Neural Networks for Pattern Recognition","author":"C.M. Bishop","year":"1995","unstructured":"Bishop, C.M.: Neural Networks for Pattern Recognition. Oxford University Press, New York (1995)"},{"key":"5_CR6","volume-title":"Modeling the Internet and the Web - Probabilistic Methods and Algorithms","author":"P. Baldi","year":"2003","unstructured":"Baldi, P., Frasconi, P., Smyth, P.: Modeling the Internet and the Web - Probabilistic Methods and Algorithms. Wiley, New York (2003)"},{"key":"5_CR7","volume-title":"Bioinformatics - A Machine Learning Approach","author":"P. Baldi","year":"2003","unstructured":"Baldi, P., Brunak, S.: Bioinformatics - A Machine Learning Approach. MIT Press, Cambridge (2003)"},{"key":"5_CR8","volume-title":"Knowledge Representation: Logical, Philosophical, and Computational Foundations","author":"J. Sowa","year":"1999","unstructured":"Sowa, J.: Knowledge Representation: Logical, Philosophical, and Computational Foundations. PWS Publishing Co., New York (1999)"},{"key":"5_CR9","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1038\/75556","volume":"25","author":"M. Ashburner","year":"2000","unstructured":"Ashburner, M., Ball, C., Blake, J., Botstein, D., Butler, H., Cherry, J., Davis, A., Dolinski, K., Dwight, S., Eppig, J., Harris, M., Hill, D., Issel-Tarver, L., Kasarskis, A., Lewis, S., Matese, J., Richardson, J., Ringwald, M., Rubin, G., Sherlock, G.: Gene ontology: tool for unification of biology. Nature Genetics\u00a025, 25\u201329 (2000)","journal-title":"Nature Genetics"},{"key":"5_CR10","unstructured":"Reinoso-Castillo, J., Silvescu, A., Caragea, D., Pathak, J., Honavar, V.: Information extraction and integration from heterogeneous, distributed, autonomous information sources: a federated, query-centric approach. In: IEEE International Conference on Information Integration and Reuse, Las Vegas, Nevada (2003)"},{"key":"5_CR11","doi-asserted-by":"crossref","unstructured":"Caragea, D., Pathak, J., Honavar, V.: Learning classifiers from semantically heterogeneous data. In: Proceedings of the International Conference on Ontologies, Databases, and Applications of Semantics for Large Scale Information Systems (2004)","DOI":"10.1007\/978-3-540-30469-2_9"},{"volume-title":"Relational Data Mining","year":"2001","key":"5_CR12","unstructured":"Dzeroski, S., Lavrac, N. (eds.): Relational Data Mining. Springer, Heidelberg (2001)"},{"key":"5_CR13","doi-asserted-by":"crossref","unstructured":"Getoor, L., Friedman, N., Koller, D., Pfeffer, A.: Learning probabilistic relational models. In: Dzeroski, S., Lavrac, N.(eds.) Relational Data Mining. Springer, Heidelberg (2001)","DOI":"10.1007\/978-3-662-04599-2_13"},{"key":"5_CR14","first-page":"1300","volume-title":"Proceedings of the Sixteenth International Joint Conference on Artificial Intelligence","author":"N. Friedman","year":"1999","unstructured":"Friedman, N., Getoor, L., Koller, D., Pfeffer, A.: Learning probabilistic relational models. In: Proceedings of the Sixteenth International Joint Conference on Artificial Intelligence, Orlando, FL, pp. 1300\u20131309. Morgan Kaufmann Publishers Inc., San Francisco (1999)"},{"key":"5_CR15","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1007\/978-3-540-39917-9_5","volume-title":"Inductive Logic Programming","author":"A. Atramentov","year":"2003","unstructured":"Atramentov, A., Leiva, H., Honavar, V.: Learning decision trees from multi-relational data. In: In Horv\u00e1th, T., Yamamoto, A. (eds.) ILP 2003. LNCS (LNAI), vol.\u00a02835, pp. 38\u201356. Springer, Heidelberg (2003)"},{"key":"5_CR16","doi-asserted-by":"crossref","unstructured":"Neville, J., Jensen, D., Gallagher, B.: Simple estimators for relational bayesian classifiers. In: ICDM 2003 (2003)","DOI":"10.1109\/ICDM.2003.1250989"},{"key":"5_CR17","volume-title":"Statistical Inference","author":"G. Casella","year":"2001","unstructured":"Casella, G., Berger, R.: Statistical Inference. Duxbury Press, Belmont (2001)"},{"key":"5_CR18","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511815850","volume-title":"Statistical Models","author":"A. Davidson","year":"2003","unstructured":"Davidson, A.: Statistical Models. Cambridge University Press, London (2003)"},{"key":"5_CR19","doi-asserted-by":"publisher","first-page":"983","DOI":"10.1145\/293347.293351","volume":"45","author":"M. Kearns","year":"1998","unstructured":"Kearns, M.: Efficient noise-tolerant learning from statistical queries. Journal of the ACM\u00a045, 983\u20131006 (1998)","journal-title":"Journal of the ACM"},{"key":"5_CR20","doi-asserted-by":"crossref","unstructured":"Caragea, D., Silvescu, A., Honavar, V.: A framework for learning from distributed data using sufficient statistics and its application to learning decision trees. International Journal of Hybrid Intelligent Systems\u00a01 (2004)","DOI":"10.3233\/HIS-2004-11-210"},{"key":"5_CR21","doi-asserted-by":"crossref","unstructured":"Caragea, D., Silvescu, A., Honavar, V.: Decision tree induction from distributed heterogeneous autonomous data sources. In: Proceedings of the International Conference on Intelligent Systems Design and Applications, Tulsa, Oklahoma (2003)","DOI":"10.1007\/978-3-540-44999-7_33"},{"key":"5_CR22","series-title":"Lecture Notes in Artificial Intelligence","first-page":"53","volume-title":"Machine Learning: ECML 2000","author":"D. Caragea","year":"2000","unstructured":"Caragea, D., Silvescu, A., Honavar, V.: Agents that learn from distributed dynamic data sources. In: Lopez de Mantaras, R., Plaza, E. (eds.) ECML 2000. LNCS (LNAI), vol.\u00a01810, pp. 53\u201361. Springer, Heidelberg (2000)"},{"key":"5_CR23","unstructured":"Caragea, C., Caragea, D., Honavar, V.: Learning support vector machine classifiers from distributed data. extended abstract. In: Proceedings of the 22nd National Conference on Artificial Intelligence, AAAI 2005 (2005)"},{"key":"5_CR24","unstructured":"Caragea, D.: Learning classifiers from Distributed, Semantically Heterogeneous, Autonomous Data Sources. Ph.d. thesis, Department of Computer Science. Iowa State University, Ames, Iowa, USA (2004)"},{"key":"5_CR25","first-page":"81","volume":"1","author":"R. Quinlan","year":"1986","unstructured":"Quinlan, R.: Induction of decision trees. Machine Learning\u00a01, 81\u2013106 (1986)","journal-title":"Machine Learning"},{"key":"5_CR26","unstructured":"Breiman, L., Friedman, J., Olshen, R., Stone, C.: Classification and regression trees, Wadsworth, Monterey, CA (1984)"},{"key":"5_CR27","first-page":"204","volume-title":"Proceedings of the Fourth International Conference on KDD","author":"G. Graefe","year":"1998","unstructured":"Graefe, G., Fayyad, U., Chaudhuri, S.: On the efficient gathering of sufficient statistics for classification from large sql databases. In: Proceedings of the Fourth International Conference on KDD, pp. 204\u2013208. AAAI Press, Menlo Park (1998)"},{"key":"5_CR28","doi-asserted-by":"crossref","first-page":"67","DOI":"10.1613\/jair.453","volume":"8","author":"A.W. Moore","year":"1998","unstructured":"Moore, A.W., Lee, M.S.: Cached sufficient statistics for efficient machine learning with large datasets. Journal of Artificial Intelligence Research\u00a08, 67\u201391 (1998)","journal-title":"Journal of Artificial Intelligence Research"},{"key":"5_CR29","unstructured":"Wang, X., Schroeder, D., Dobbs, D., Honavar, V.: Data-driven discovery of rules for protein function classification based on sequence motifs: Rules discovered for peptidase families based on meme motifs outperform those based on prosite patterns and profiles. In: Proceedings of the Conference on Computational Biology and Genome Informatics (2002)"},{"key":"5_CR30","unstructured":"Andorf, C., Silvescu, A., Dobbs, D., Honavar, V.: Learning classifiers for assigning protein sequences to gene ontology functional families. In: Fifth International Conference on Knowledge Based Computer Systems (KBCS 2004), India (2004)"},{"key":"5_CR31","first-page":"273","volume":"20","author":"C. Cortes","year":"1995","unstructured":"Cortes, C., Vapnik, V.: Support vector networks. Machine Learning\u00a020, 273\u2013297 (1995)","journal-title":"Machine Learning"},{"key":"5_CR32","volume-title":"An Introduction to Support Vector Machines","author":"N. Cristianini","year":"2000","unstructured":"Cristianini, N., Shawe-Taylor, J.: An Introduction to Support Vector Machines. Cambridge University Press, Cambridge (2000)"},{"issue":"1","key":"5_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1080\/10556780008805771","volume":"13","author":"P.S. Bradley","year":"2000","unstructured":"Bradley, P.S., Mangasarian, O.L.: Massive data discrimination via linear support vector machines. Optimization Methods and Software\u00a013(1), 1\u201310 (2000)","journal-title":"Optimization Methods and Software"},{"key":"5_CR34","doi-asserted-by":"publisher","first-page":"237","DOI":"10.1023\/A:1009832825273","volume":"3","author":"A. Srivastava","year":"1999","unstructured":"Srivastava, A., Han, E., Kumar, V., Singh, V.: Parallel formulations of decision-tree classification algorithms. Data Mining and Knowledge Discovery\u00a03, 237\u2013261 (1999)","journal-title":"Data Mining and Knowledge Discovery"},{"key":"5_CR35","unstructured":"Grossman, L., Gou, Y.: Parallel methods for scaling data mining algorithms to large data sets. In: Zytkow, J. (ed.) Handbook on Data Mining and Knowledge Discovery. Oxford University Press, Oxford (2001)"},{"key":"5_CR36","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1023\/A:1009876119989","volume":"3","author":"F.J. Provost","year":"1999","unstructured":"Provost, F.J., Kolluri, V.: A survey of methods for scaling up inductive algorithms. Data Mining and Knowledge Discovery\u00a03, 131\u2013169 (1999)","journal-title":"Data Mining and Knowledge Discovery"},{"key":"5_CR37","unstructured":"Park, B., Kargupta, H.: Constructing simpler decision trees from ensemble models using Fourier analysis. In: Proceedings of the 7th Workshop on Research Issues in Data Mining and Knowledge Discovery (DMKD 2002), Madison, WI, ACM SIGMOD, pp. 18\u201323 (2002)"},{"key":"5_CR38","first-page":"98","volume-title":"Proceedings of the Fourteenth International Conference on Machine Learning","author":"P. Domingos","year":"1997","unstructured":"Domingos, P.: Knowledge acquisition from examples via multiple models. In: Proceedings of the Fourteenth International Conference on Machine Learning, Nashville, TN, pp. 98\u2013106. Morgan Kaufmann, San Francisco (1997)"},{"key":"5_CR39","unstructured":"Prodromidis, A., Chan, P., Stolfo, S.: Meta-learning in distributed data mining systems: issues and approaches. In: Kargupta, H., Chan, P. (eds.) Advances of Distributed Data Mining. AAAI Press, Menlo Park (2000)"},{"key":"5_CR40","unstructured":"Bhatnagar, R., Srinivasan, S.: Pattern discovery in distributed databases. In: Proceedings of the Fourteenth AAAI Conference, Providence, pp. 503\u2013508. AAAI Press\/The MIT Press (1997)"},{"key":"5_CR41","unstructured":"Kargupta, H., Park, B., Hershberger, D., Johnson, E.: Collective data mining: A new perspective toward distributed data mining. In: Kargupta, H., Chan, P. (eds.) Advances in Distributed and Parallel Knowledge Discovery. MIT Press, Cambridge (1999)"},{"key":"5_CR42","doi-asserted-by":"crossref","unstructured":"Mansour, J.: Learning boolean functions via the fourier transform. In: Theoretical Advances in Neural Computation and Learning. Kluwer, Dordrecht (1994)","DOI":"10.1007\/978-1-4615-2696-4_11"},{"key":"5_CR43","doi-asserted-by":"crossref","first-page":"575","DOI":"10.1007\/978-1-4615-1567-8_24","volume-title":"Logic-based artificial intelligence","author":"A. Levy","year":"2000","unstructured":"Levy, A.: Logic-based techniques in data integration. In: Logic-based artificial intelligence, pp. 575\u2013595. Kluwer Academic Publishers, Dordrecht (2000)"},{"key":"5_CR44","series-title":"Lecture Notes in Bioinformatics","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1007\/11530084_15","volume-title":"Data Integration in the Life Sciences","author":"D. Caragea","year":"2005","unstructured":"Caragea, D., Silvescu, A., Pathak, J., Bao, J., Andorf, C., Dobbs, D., Honavar, V.: Information integration and knowledge acquisition from semantically heterogeneous biological data sources. In: Lud\u00e4scher, B., Raschid, L. (eds.) DILS 2005. LNCS (LNBI), vol.\u00a03615, pp. 175\u2013190. Springer, Heidelberg (2005)"},{"key":"5_CR45","first-page":"192","volume-title":"Proceedings of the IEEE Conference on Information Integration and Reuse","author":"P. Bonatti","year":"2003","unstructured":"Bonatti, P., Deng, Y., Subrahmanian, V.: An ontology-extended relational algebra. In: Proceedings of the IEEE Conference on Information Integration and Reuse, pp. 192\u2013199. IEEE Press, Los Alamitos (2003)"},{"key":"5_CR46","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"164","DOI":"10.1007\/978-3-540-39718-2_11","volume-title":"The Semantic Web - ISWC 2003","author":"P. Bouquet","year":"2003","unstructured":"Bouquet, P., Giunchiglia, F., van Harmelen, F., Serafini, L., Stuckenschmidt, H.: C-OWL: Contextualizing ontologies. In: Fensel, D., Sycara, K., Mylopoulos, J. (eds.) ISWC 2003. LNCS, vol.\u00a02870, pp. 164\u2013179. Springer, Heidelberg (2003)"},{"key":"5_CR47","unstructured":"Bao, J., Honavar, V.: Collaborative ontology building with wiki@nt - a multi-agent based ontology building environment. In: Proceedings of the Third International Workshop on Evaluation of Ontology based Tools, at the Third International Semantic Web Conference ISWC, Hiroshima, Japan (2004)"},{"key":"5_CR48","unstructured":"Bao, J., Honavar, V.: An efficient algorithm for reasoning about subsumption and equivalence relationships to support collaborative editing of ontologies and inter-ontology mappings. under review (2005)"},{"key":"5_CR49","doi-asserted-by":"crossref","unstructured":"Hull, R.: Managing semantic heterogeneity in databases: A theoretical perspective. In: PODS, Tucson, Arizona, pp. 51\u201361 (1997)","DOI":"10.1145\/263661.263668"},{"key":"5_CR50","doi-asserted-by":"crossref","unstructured":"Davidson, S., Crabtree, J., Brunk, B., Schug, J., Tannen, V., Overton, G., Stoeckert, C.: K2\/Kleisli and GUS: experiments in integrated access to genomic data sources. IBM Journal\u00a040 (2001)","DOI":"10.1147\/sj.402.0512"},{"key":"5_CR51","doi-asserted-by":"crossref","unstructured":"Eckman, B.: A practitioner\u2019s guide to data management and data integration in bioinformatics. Bioinformatics, 3\u201374 (2003)","DOI":"10.1016\/B978-155860829-0\/50005-X"},{"key":"5_CR52","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1145\/96602.96604","volume":"22","author":"A. Sheth","year":"1990","unstructured":"Sheth, A., Larson, J.: Federated databases: architectures and issues. ACM Computing Surveys\u00a022, 183\u2013236 (1990)","journal-title":"ACM Computing Surveys"},{"key":"5_CR53","unstructured":"Barsalou, T., Gangopadhyay, D.: M(dm): An open framework for interoperation of multimodel multidatabase systems. IEEE Data Engineering (1992)"},{"key":"5_CR54","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1109\/2.156378","volume":"25","author":"M. Bright","year":"1992","unstructured":"Bright, M., Hurson, A., Pakzad, S.: A taxonomy and current issues in multibatabase systems. Computer Journal\u00a025, 5\u201360 (1992)","journal-title":"Computer Journal"},{"key":"5_CR55","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1109\/64.621227","volume":"12","author":"G. Wiederhold","year":"1997","unstructured":"Wiederhold, G., Genesereth, M.: The conceptual basis for mediation services. IEEE Expert\u00a012, 38\u201347 (1997)","journal-title":"IEEE Expert"},{"key":"5_CR56","doi-asserted-by":"crossref","unstructured":"Garcia-Molina, H., Papakonstantinou, Y., Quass, D., Rajaraman, A., Sagiv, Y., Ullman, J., Vassalos, V., Widom, J.: The TSIMMIS approach to mediation: data models and languages. Journal of Intelligent Information Systems, Special Issue on Next Generation Information Technologies and Systems\u00a08 (1997)","DOI":"10.1023\/A:1008683107812"},{"key":"5_CR57","doi-asserted-by":"crossref","unstructured":"Chang, C.K., Garcia-Molina, H.: Mind your vocabulary: query mapping across heterogeneous information sources. In: ACM SIGMOD International Conference On Management of Data, Philadelphia, PA (1999)","DOI":"10.1145\/304182.304212"},{"key":"5_CR58","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1142\/S0218215793000071","volume":"2","author":"Y. Arens","year":"1993","unstructured":"Arens, Y., Chin, C., Hsu, C., Knoblock, C.: Retrieving and integrating data from multiple information sources. International Journal on Intelligent and Cooperative Information Systems\u00a02, 127\u2013158 (1993)","journal-title":"International Journal on Intelligent and Cooperative Information Systems"},{"key":"5_CR59","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1142\/S0218843001000291","volume":"10","author":"C. Knoblock","year":"2001","unstructured":"Knoblock, C., Minton, S., Ambite, J., Ashish, N., Muslea, I., Philpot, A., Tejada, S.: The ariadne approach to Web-based information integration. International Journal of Cooperative Information Systems\u00a010, 145\u2013169 (2001)","journal-title":"International Journal of Cooperative Information Systems"},{"key":"5_CR60","doi-asserted-by":"crossref","unstructured":"Lu, J., Moerkotte, G., Schue, J., Subrahmanian, V.: Efficient maintenance of materialized mediated views. In: Proceedings of 1995 ACM SIGMOD Conference on Management of Data, San Jose, CA (1995)","DOI":"10.1145\/223784.223850"},{"key":"5_CR61","unstructured":"Levy, A.: The information manifold approach to data integration. IEEE Intelligent Systems\u00a013 (1998)"},{"key":"5_CR62","doi-asserted-by":"crossref","unstructured":"Draper, D., Halevy, A.Y., Weld, D.S.: The nimble XML data integration system. In: ICDE, pp. 155\u2013160 (2001)","DOI":"10.1109\/ICDE.2001.914824"},{"key":"5_CR63","doi-asserted-by":"crossref","unstructured":"Etzold, T., Harris, H., Beulah, S.: SRS: An integration platform for databanks and analysis tools in bioinformatics. Bioinformatics Managing Scientific Data, 35\u201374 (2003)","DOI":"10.1016\/B978-155860829-0\/50007-3"},{"key":"5_CR64","doi-asserted-by":"crossref","unstructured":"Haas, L., Schwarz, P., Kodali, P., Kotlar, E., Rice, J., Swope, W.: DiscoveryLink: a system for integrated access to life sciences data sources. IBM System Journal\u00a040 (2001)","DOI":"10.1147\/sj.402.0489"},{"key":"5_CR65","doi-asserted-by":"crossref","unstructured":"Stevens, R., Goble, C., Paton, N., Becchofer, S., Ng, G., Baker, P., Bass, A.: Complex query formulation over diverse sources in tambis. Bioinformatics, 189\u2013220 (2003)","DOI":"10.1016\/B978-155860829-0\/50009-7"},{"key":"5_CR66","doi-asserted-by":"crossref","unstructured":"Chen, J., Chung, S., Wong, L.: The Kleisli query system as a backbone for bioinformatics data integration and analisis. Bioinformatics, 147\u2013188 (2003)","DOI":"10.1016\/B978-155860829-0\/50008-5"},{"key":"5_CR67","doi-asserted-by":"crossref","unstructured":"Tannen, V., Davidson, S., Harker, S.: The information integration in K2. Bioinformatics, 225\u2013248 (2003)","DOI":"10.1016\/B978-155860829-0\/50010-3"},{"key":"5_CR68","doi-asserted-by":"publisher","first-page":"808","DOI":"10.1109\/69.729736","volume":"10","author":"A. Tomasic","year":"1998","unstructured":"Tomasic, A., Rashid, L., Valduriez, P.: Scaling heterogeneous databases and design of DISCO. IEEE Transactions on Knowledge and Data Engineering\u00a010, 808\u2013823 (1998)","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"key":"5_CR69","unstructured":"Haas, L., Kossmann, D., Wimmers, E., Yan, J.: Optimizing queries across diverse sources. In: Proceedings of the 23rd VLDB Conference, Athens, Greece, pp. 267\u2013285 (1997)"},{"key":"5_CR70","doi-asserted-by":"crossref","unstructured":"Rodriguez-Martinez, M., Roussopoulos, R.: MOCHA: a self-extensible database middleware system for distributed data sources. In: Proceedings of the 2000 ACM SIGMOD International Conference on Management of Data, Dallas, TX, pp. 213\u2013224 (2000)","DOI":"10.1145\/342009.335413"},{"key":"5_CR71","first-page":"1204","volume-title":"Proceedings of the International Joint Conference on Artificial Intelligence","author":"E. Lambrecht","year":"1999","unstructured":"Lambrecht, E., Kambhampati, S., Gnanaprakasam, S.: Optimizing recursive information-gathering plans. In: Proceedings of the International Joint Conference on Artificial Intelligence, pp. 1204\u20131211. AAAI Press, Menlo Park (1999)"},{"key":"5_CR72","doi-asserted-by":"crossref","unstructured":"Maluf, D., Wiederhold, G.: Abstraction of representation in interoperation. In: Sommer, G. (ed.) AFPAC 1997. LNCS(LNAI), vol.\u00a01315. Springer, Heidelberg (1997)","DOI":"10.1007\/3-540-63614-5_43"},{"key":"5_CR73","unstructured":"Zhang, J., Honavar, V.: Learning decision tree classifiers from attribute-value taxonomies and partially specified data. In: Fawcett, T., Mishra, N. (eds.) Proceedings of the International Conference on Machine Learning, Washington, DC, pp. 880\u2013887 (2003)"},{"key":"5_CR74","doi-asserted-by":"crossref","unstructured":"Zhang, J., Honavar, V.: Learning concise and accurate naive bayes classifiers from attribute value taxonomies and data. In: Proceedings of the Fourth ICMD (2004)","DOI":"10.1007\/s10115-005-0211-z"},{"key":"5_CR75","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1016\/0004-3702(88)90002-1","volume":"36","author":"D. Haussler","year":"1988","unstructured":"Haussler, D.: Quantifying inductive bias: AI learning algorithms and Valiant\u2019s learning framework. Artificial Intelligence\u00a036, 177\u2013221 (1988)","journal-title":"Artificial Intelligence"},{"key":"5_CR76","doi-asserted-by":"crossref","unstructured":"Friedman, N., Geiger, D., Goldszmidt, M.: Bayesian network classifiers. Machine Learning\u00a029 (1997)","DOI":"10.1023\/A:1007465528199"},{"key":"5_CR77","doi-asserted-by":"crossref","unstructured":"Caragea, D., Zhang, J., Pathak, J., Honavar, V.: Learning classifiers from distributed, ontology-extended data sources. under review (2005)","DOI":"10.1007\/11823728_35"},{"key":"5_CR78","unstructured":"Walker, A.: On retrieval from a small version of a large database. In: VLDB Conference 1989 (1989)"},{"key":"5_CR79","doi-asserted-by":"crossref","unstructured":"DeMichiel, L.: Resolving database incompatibility: An approach to performing relational operations over mismatched domains. IEEE Trans. Knowl. Data Eng.\u00a01 (1989)","DOI":"10.1109\/69.43423"},{"key":"5_CR80","doi-asserted-by":"crossref","unstructured":"Chen, A., Tseng, F.: Evaluating aggregate operations over imprecise data. IEEE Trans. On Knowledge and Data Engineering\u00a08 (1996)","DOI":"10.1109\/69.494166"},{"key":"5_CR81","doi-asserted-by":"crossref","unstructured":"McClean, S., Scotney, B., Shapcott, M.: Aggregation of imprecise and uncertain information in databases. IEEE Transactions on Knowledge and Data Engineering\u00a06 (2001)","DOI":"10.1109\/69.971186"},{"key":"5_CR82","unstructured":"Bergadano, F., Giordana, A.: Guiding induction with domain theories. In: Machine Learning An Artificial Intelligence Approach, vol.\u00a03. Morgan Kaufmann (1990)"},{"key":"5_CR83","doi-asserted-by":"crossref","unstructured":"Pazzani, M., Kibler, D.: The role of prior knowledge in inductive learning. Machine Learning\u00a09 (1992)","DOI":"10.1007\/BF00993254"},{"key":"5_CR84","doi-asserted-by":"crossref","unstructured":"Towell, G., Shavlik, J.: Knowledge-based artificial neural networks. Artificial Intelligence\u00a070 (1994)","DOI":"10.1016\/0004-3702(94)90105-8"},{"key":"5_CR85","unstructured":"Aronis, J., Kolluri, V., Provost, F., Buchanan, B.: The WoRLD: knowledge discovery from multiple distributed databases. Technical Report ISL-96-6, Intelligent Systems Laboratory, Department of Computer Science, University of Pittsburgh, Pittsburgh, PA (1996)"},{"key":"5_CR86","unstructured":"Aronis, J., Provost, F.: Increasing the efficiency of inductive learning with breadth-first marker propagation. In: Proceedings of the Third International Conference on Knowledge Discovery and Data Mining (1997)"},{"key":"5_CR87","doi-asserted-by":"crossref","unstructured":"Nunez, M.: The use of background knowledge in decision tree induction. Machine Learning\u00a06 (1991)","DOI":"10.1007\/BF00114778"},{"key":"5_CR88","doi-asserted-by":"crossref","unstructured":"Almuallim, H., Akiba, Y., Kaneda, S.: On handling tree-structured attributes. In: Proceedings of the Twelfth International Conference on Machine Learning (1995)","DOI":"10.1016\/B978-1-55860-377-6.50011-6"},{"key":"5_CR89","doi-asserted-by":"crossref","unstructured":"Dhar, V., Tuzhilin, A.: Abstract-driven pattern discovery in databases. IEEE Transactions on Knowledge and Data Engineering\u00a05 (1993)","DOI":"10.1109\/69.250075"},{"key":"5_CR90","unstructured":"Han, J., Fu, Y.: Exploration of the power of attribute-oriented induction in data mining. In: Fayyad, U.M. et al. (ed.) Advances in Knowledge Discovery and Data Mining. AAAI\/MIT Press (1996)"},{"key":"5_CR91","unstructured":"Hendler, J., Stoffel, K., Taylor, M.: Advances in high performance knowledge representation (1996)"},{"key":"5_CR92","unstructured":"Taylor, M., Stoffel, K., Hendler, J.: Ontology-based induction of high level classification rules. In: SIGMOD Data Mining and Knowledge Discovery workshop proceedings, Tuscon, Arizona (1997)"},{"key":"5_CR93","unstructured":"Pazzani, M., Mani, S., Shankle, W.: Beyond concise and colorful: Learning intelligible rules. In: Proceedings of the Fourth International Conference on Knowledge Discovery and Data Mining, Newport Beach, CA (1997)"},{"key":"5_CR94","unstructured":"Pazzani, M., Mani, M., Shankle, W.: Comprehensible knowledge discovery in databases. In: Proceedings of the the Cognitive Science Conference (1997)"},{"key":"5_CR95","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"260","DOI":"10.1007\/3-540-44914-0_16","volume-title":"Abstraction, Reformulation, and Approximation","author":"M. desJardins","year":"2000","unstructured":"desJardins, M., Getoor, L., Koller, D.: Using feature hierarchies in bayesian network learning. In: Choueiry, B.Y., Walsh, T. (eds.) SARA 2000. LNCS (LNAI), vol.\u00a01864, pp. 260\u2013270. Springer, Heidelberg (2000)"},{"key":"5_CR96","unstructured":"Rubin, D.: Multiple imputations in sample surveys: A phenomenological bayesian approach to nonresponse. In: Proceedings of the American Statistical Association, Section on Survey Research Methods, pp. 29\u201334 (1978)"},{"key":"5_CR97","doi-asserted-by":"publisher","DOI":"10.1002\/9780470316696","volume-title":"Multiple imputation for nonresponse in surveys","author":"D. Rubin","year":"1987","unstructured":"Rubin, D.: Multiple imputation for nonresponse in surveys. John Wiley and Sons, Chichester (1987)"},{"key":"5_CR98","doi-asserted-by":"crossref","unstructured":"Rubin, D.: Multiple imputation after 18+ years. Journal of the American Statistical Association\u00a091 (1996)","DOI":"10.1080\/01621459.1996.10476908"},{"key":"5_CR99","doi-asserted-by":"crossref","unstructured":"Junninen, H., Niska, H., Tuppurainen, K., Ruuskanen, J., Kolehmainen, M.: Methods for imputation of missing values in air quality data sets. Atmospheric Environment\u00a038 (2004)","DOI":"10.1016\/j.atmosenv.2004.02.026"},{"key":"5_CR100","doi-asserted-by":"crossref","unstructured":"Longford, N.: Missing data and small area estimation in the uk labour force survey. Journal of the Royal Statistical Society Series A-Statistics in Society\u00a0167 (2004)","DOI":"10.1046\/j.1467-985X.2003.00728.x"},{"key":"5_CR101","doi-asserted-by":"crossref","unstructured":"Raghunathan, T.: What do we do with missing data? some options for analysis of incomplete data. Annual Review of Public Health\u00a025 (2004)","DOI":"10.1146\/annurev.publhealth.25.102802.124410"},{"key":"5_CR102","doi-asserted-by":"crossref","DOI":"10.1002\/9781119013563","volume-title":"Statistical analysis with missing data","author":"R. Little","year":"2002","unstructured":"Little, R., Rubin, D.: Statistical analysis with missing data, 2nd edn. John Wiley and Sons, Chichester (2002)","edition":"2"},{"key":"5_CR103","unstructured":"Madow, W., Olkin, I., Rubin, D.B.: Incomplete data in sample surveys. Theory and bibliographies, vol.\u00a02. Academic Press, London (1983)"},{"key":"5_CR104","unstructured":"Madow, W., Nisselson, J., Olkin, I.: Incomplete data in sample surveys. Report and case studies, vol.\u00a01. Academic Press, New York, London (1983)"},{"key":"5_CR105","doi-asserted-by":"crossref","first-page":"i371","DOI":"10.1093\/bioinformatics\/bth920","volume":"20","author":"C. Yan","year":"2004","unstructured":"Yan, C., Dobbs, D., Honavar, V.: A two-stage classifier for identification of protein-protein interface residues. Bioinformatics\u00a020, i371\u2013i378 (2004)","journal-title":"Bioinformatics"},{"key":"5_CR106","first-page":"123","volume":"13","author":"C. Yan","year":"2004","unstructured":"Yan, C., Honavar, V., Dobbs, D.: Identifying protein-protein interaction sites from surface residues - a support vector machine approach. Neural Computing Applications\u00a013, 123\u2013129 (2004)","journal-title":"Neural Computing Applications"}],"container-title":["Lecture Notes in Computer Science","Algorithmic Learning Theory"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/11564089_5.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,30]],"date-time":"2024-01-30T21:32:42Z","timestamp":1706650362000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/11564089_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2005]]},"ISBN":["9783540292425","9783540316961"],"references-count":106,"URL":"https:\/\/doi.org\/10.1007\/11564089_5","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2005]]}}}