% ----------------------------------------------------------------
\begin{thebibliography}{99} \bibliographystyle{apalike} \bibitem[Altschul et al. 1997]{BLAST} Altschul, S.F., Madden, T.L., Sch\"{a}ffer, A.A., Zhang, J., Zhang, Z., Miller, W., and Lipman, D.J. (1997). Gapped BLAST and PSI-BLAST: a new generation of protein database search programs. Nucleic Acids Research, {\bf 25:} 3389--3402. \bibitem[Bader et al. 2003]{BIND} Bader, G.D., Betel, D., and Hogue, C.W. (2003). BIND: the Biomolecular Interaction Network Database. Nucleic Acids Research, {\bf 31:} 248--250. \bibitem[Breitkreutz et al. 2003]{GRID} Breitkreutz, B.J., Stark, C., and Tyers, M. (2003). The GRID: The General Repository for Interaction Datasets. Genome Biology, {\bf 4:} R23. \bibitem[Clare et al. 2002]{Clare} Clare, A., and King, R.D. (2002). Machine Learning of Functional Class from Phenotype Data. Bioinformatics, {\bf 18:} 160--166. \bibitem[Costanzo et al. 2001]{YPD} Costanzo, M.C., Crawford, M.E., Hirschman, J.E., Kranz, J.E., Olsen, P., Robertson, L.S., Skrzypek, M.S., Braun, B.R., Hopkins, K.L., and Kondu, P. et al. (2001). YPD\textsuperscript{TM}, PombePD\textsuperscript{TM}, and WormPD\textsuperscript{TM}: model organism volumes of the BioKnowledge library, an integrated resource for protein information. Nucleic Acids Research, {\bf 29:} 75--79. \bibitem[Deane et al. 2002]{Deane} Deane, C.M., Salwinski, L., Xenarios, I., and Eisenberg, D. (2002). Protein interactions: Two methods for assessment of the reliability of high-throughput observations. Molecular and Cellular Proteomics, {\bf 1:} 349--356. \bibitem[Deng et al. 2002]{DengCSB} Deng, M.H., Zhang, K., Mehta, S., Chen, T., and Sun, F.Z. (2002). Prediction of Protein Function Using Protein-protein Interaction Data. In {\it Proceedings of the First IEEE Computer Society Bioinformatics Conference (CSB2002):} 197--206. \bibitem[Deng et al. 2003a]{DengPSB} Deng, M.H., Sun, F.Z., and Chen, T. (2003). 
Assessment of the Reliability of Protein-protein Interactions and Protein Function Prediction. {\it Pacific Symposium on Biocomputing (PSB2003):} 140--151. \bibitem[Deng et al. 2003b]{DengRECOMB} Deng, M.H., Chen, T., and Sun, F.Z. (2003). An Integrated Probabilistic Model for Functional Prediction of Proteins. In {\it Proceedings of the Seventh International Conference on Computational Molecular Biology (RECOMB2003):} 95--103. \bibitem[Deng et al. 2004]{Minghua2004} Deng, M.H., Tu, Z.D., Sun, F.Z., and Chen, T. (2004). Mapping gene ontology to proteins based on protein-protein interaction data. Bioinformatics, {\bf 20:} 895--902. \bibitem[Dwight et al. 2002]{SGD} Dwight, S.S., Harris, M.A., Dolinski, K., Ball, C.A., Binkley, G., Christie, K.R., Fisk, D.G., Issel-Tarver, L., Schroeder, M., and Sherlock, G. et al. (2002). Saccharomyces Genome Database (SGD) Provides Secondary Gene Annotation Using the Gene Ontology (GO). Nucleic Acids Research, {\bf 30:} 69--72. \bibitem[Drawid et al. 2000]{DrawidJMB} Drawid, A., and Gerstein, M. (2000). A Bayesian System Integrating Expression Data with Sequence Patterns for Localizing Proteins: Comprehensive Application to the Yeast Genome. Journal of Molecular Biology, {\bf 301:} 1059--1075. \bibitem[Eisen et al. 1998]{Eisen} Eisen, M.B., Spellman, P.T., Brown, P.O. and Botstein, D. (1998). Cluster analysis and display of genome-wide expression patterns. Proceedings of the National Academy of Sciences USA, {\bf 95:} 14863--14868. \bibitem[Enright et al. 1999]{Enright} Enright, A.J., Iliopoulos, I., Kyrpides, N.C. and Ouzounis, C.A. (1999). Protein interaction maps for complete genomes based on gene fusion events. Nature, {\bf 402:} 86--90. \bibitem[Fellenberg et al. 2000]{Fellenberg} Fellenberg, M., Albermann, K., Zollner, A., Mewes, H.W. and Hani, J. (2000). Integrative Analysis of Protein Interaction Data. In {\it Proc. of the Eighth Int. Conf. on Intelligent Systems for Molecular Biology (ISMB2000)}: 152--161. 
\bibitem[Frank and Strauss 1986]{Frank and Strauss 1986} Frank, O., and Strauss, D. (1986). Markov graphs. Journal of the American Statistical Association, {\bf 81:} 832--842. \bibitem[Gavin et al. 2002]{Gavin et al. 2002} Gavin, A., B\"{o}sche, M., Krause, R., Grandi, P., Marzioch, M., Bauer, A., Schultz, J., Rick, J.M., Michon, A., Cruciat, C. et al. (2002). Functional organization of the yeast proteome by systematic analysis of protein complexes. Nature, {\bf 415:} 141--147. \bibitem[GO Consortium 2001]{GO2001} The Gene Ontology Consortium. (2001). Creating the Gene Ontology Resource: Design and Implementation. Genome Research, {\bf 11:} 1425--1433. \bibitem[Gupta et al. 2002]{GuptaPSB} Gupta, R., and Brunak, S. (2002). Prediction of Glycosylation Across the Human Proteome and the Correlation to Protein Function. {\it Pacific Symposium on Biocomputing (PSB2002):} 310--322. \bibitem[Hegyi et al. 1999]{HegyiJMB} Hegyi, H., and Gerstein, M. (1999). The Relationship Between Protein Structure and Function: a Comprehensive Survey with Application to the Yeast Genome. Journal of Molecular Biology, {\bf 288:} 147--164. \bibitem[Hegyi et al. 2001]{HegyiGR} Hegyi, H., and Gerstein, M. (2001). Annotation Transfer for Genomics: Measuring Functional Divergence in Multi-domain Proteins. Genome Research, {\bf 11:} 1632--1640. \bibitem[Hishigaki et al. 2001]{Hishigaki} Hishigaki, H., Nakai, K., Ono, T., Tanigami, A., and Takagi, T. (2001). Assessment of prediction accuracy of protein function from protein-protein interaction data. Yeast, {\bf 18:} 523--531. \bibitem[Ho et al. 2002]{HoComplexMS} Ho, Y., Gruhler, A., Heilbut, A., Bader, G.D., Moore, L., Adams, S., Millar, A., Taylor, P., Bennett, K., and Boutilier, K., et al. (2002). Systematic Identification of Protein Complexes in {\it Saccharomyces cerevisiae} by Mass Spectrometry. Nature, {\bf 415:} 180--183. \bibitem[Huh et al. 2003]{Huh} Huh, W.K., Falvo, J.V., Gerke, L.C., Carroll, A.S., Howson, R.W., Weissman, J.S., and O'Shea, E.K. (2003). 
Global analysis of protein localization in budding yeast. Nature, {\bf 425(6959):} 686--691. \bibitem[Huynen et al. 2003]{Huynen et al. 2003} Huynen, M.A., Snel, B., von Mering, C., and Bork, P. (2003). Function prediction and protein networks. Current Opinion in Cell Biology, {\bf 15:} 191--198. \bibitem[Ito et al. 2000]{Ito2000} Ito, T., Tashiro, K., Muta, S., Ozawa, R., Chiba, T., Nishizawa, M., Yamamoto, K., Kuhara, S., and Sakaki, Y. (2000). Toward a protein-protein interaction map of the budding yeast: a comprehensive system to examine two-hybrid interactions in all possible combinations between the yeast proteins. Proceedings of the National Academy of Sciences USA, {\bf 97:} 1143--1147. \bibitem[Ito et al. 2001]{Ito2001} Ito, T., Chiba, T., Ozawa, R., Yoshida, M., Hattori, M. and Sakaki, Y. (2001). A comprehensive two-hybrid analysis to explore the yeast protein interactome. Proceedings of the National Academy of Sciences USA, {\bf 98:} 4569--4574. \bibitem[Jaimovich et al. 2005]{Jaimovich et al. 2005} Jaimovich, A., Elidan, G., Margalit, H., and Friedman, N. (2005). Towards an Integrated Protein-protein Interaction Network. In {\it Proceedings of the Ninth International Conference on Computational Molecular Biology (RECOMB2005):} 14--30. \bibitem[Jansen et al. 2003]{Jansen et al. 2003} Jansen, R., Yu, H.Y., Greenbaum, D., Kluger, Y., Krogan, N.J., Chung, S.B., Emili, A., Snyder, M., Greenblatt, J.F., and Gerstein, M. (2003). A Bayesian networks approach for predicting protein-protein interactions from genomic data. Science, {\bf 302:} 449--453. \bibitem[Jensen et al. 2002]{JensenJMB} Jensen, L.J., Gupta, R., Blom, N., Devos, D., Tamames, J., Kesmir, C., Nielsen, H., St\ae{}rfeldt, H.H., Rapacki, K., and Workman, C., et al. (2002). Prediction of Human Protein Function from Post-translational Modifications and Localization Features. Journal of Molecular Biology, {\bf 319:} 1257--1265. \bibitem[Kell et al. 2000]{Kell2000} Kell, D.B., and King, R.D. (2000). 
On the Optimization of Classes for the Assignment of Unidentified Reading Frames in Functional Genomics Programmes: the Need for Machine Learning. Trends in Biotechnology, {\bf 18:} 93--98. \bibitem[King et al. 2001]{King} King, R.D., Karwath, A., Clare, A., and Dehaspe, L. (2001). The Utility of Different Representations of Protein Sequence for Predicting Functional Class. Bioinformatics, {\bf 17:} 445--454. \bibitem[Kondor and Lafferty 2002]{Kondor and Lafferty 2002} Kondor, R.I., and Lafferty, J. (2002). Diffusion kernels on graphs and other discrete input spaces. In {\it Proceedings of the International Conference on Machine Learning:} 315--322. \bibitem[Lanckriet et al. 2004a]{Lanckriet et al. 2004a} Lanckriet, G.R.G., Deng, M., Cristianini, N., Jordan, M.I., and Noble, W.S. (2004). Kernel-based data fusion and its application to protein function prediction in yeast. Proceedings of the Pacific Symposium on Biocomputing: 300--311. \bibitem[Lanckriet et al. 2004b]{Lanckriet et al. 2004} Lanckriet, G.R.G., Deng, M.H., Cristianini, N., Jordan, M.I., and Noble, W.S. (2004). Kernel-based integration of genomic data using semidefinite programming. In Sch\"{o}lkopf, B., Tsuda, K., and Vert, J.-P. (eds) \emph{Kernel Methods in Computational Biology,} MIT Press, Cambridge, MA, pp. 71--92. \bibitem[Lanckriet et al. 2004c]{Lanckriet et al. 2004c} Lanckriet, G.R.G., De Bie, T., Cristianini, N., Jordan, M.I., and Noble, W.S. (2004). A statistical framework for genomic data fusion. Bioinformatics, {\bf 20:} 2626--2635. \bibitem[Lee et al. 2005a]{Lee_location} Lee, H.J., Deng, M.H., Sun, F.Z., and Chen, T. (2005). Assessment of the Reliability of Protein-Protein Interactions Using Protein Localization and Gene Expression Data. Proceedings of the International Joint Conference of InCoB, AASBi and KSBI (BIOINFO 2005). \bibitem[Lee et al. 2005b]{Lee_function} Lee, H.J., Tu, Z.D., Deng, M.H., Sun, F.Z., and Chen, T. 
(2005). Diffusion Kernel Based Logistic Regression Models for Protein Function Prediction. Technical Report. \bibitem[Letovsky and Kasif 2003]{Letovsky} Letovsky, S. and Kasif, S. (2003). Predicting protein function from protein/protein interaction data: a probabilistic approach. Bioinformatics, {\bf 19 (Suppl.1):} 197--204. \bibitem[Li 1995]{LiSZ} Li, S.Z. (1995). Markov Random Field Modeling in Computer Vision. Springer-Verlag: Tokyo. \bibitem[Lin et al. 2004]{Lin et al. 2004} Lin, N., Wu, B., Jansen, R., Gerstein, M. and Zhao, H.Y. (2004). Information assessment on predicting protein-protein interactions. BMC Bioinformatics, {\bf 5:} 154. \bibitem[Liu 2001]{LiuJS} Liu, J.S. (2001). Monte Carlo strategies in scientific computing. Springer-Verlag: New York. \bibitem[Lu et al. 2005]{Lu et al. 2005} Lu, L.J., Xia, Y., Paccanaro, A., Yu, H.Y. and Gerstein, M. (2005). Assessing the limits of genomic data integration for predicting protein networks. Genome Research, {\bf 15:} 945--953. \bibitem[Marcotte et al. 1999a]{EisenbergRosetta} Marcotte, E.M., Pellegrini, M., Ng, H.L., Rice, D.W., Yeates, T.O. and Eisenberg, D. (1999). Detecting protein function and protein-protein interactions from genome sequences. Science, {\bf 285:} 751--753. \bibitem[Marcotte et al. 1999b]{EisenbergCombined} Marcotte, E.M., Pellegrini, M., Thompson, M.J., Yeates, T.O. and Eisenberg, D. (1999). A combined algorithm for genome-wide prediction of protein function. Nature, {\bf 402:} 83--86. \bibitem[Mering et al. 2002]{MeringNature} Mering, C.V., Krause, R., Snel, B., Cornell, M., Oliver, S.G., Fields, S. and Bork, P. (2002). Comparative assessment of large-scale data sets of protein-protein interactions. Nature, {\bf 417:} 399--403. \bibitem[Mewes et al. 2002]{MIPS} Mewes, H.W., Frishman, D., Guldener, U., Mannhaupt, G., Mayer, K., Mokrejs, M., Morgenstern, B., Munsterkotter, M., Rudd, S., and Weil, B. (2002). MIPS: a database for genomes and protein sequences. Nucleic Acids Research, {\bf 30:} 31--34. 
\bibitem[Mrowka et al. 2001]{Mrowka} Mrowka, R., Patzak, A., and Herzel, H. (2001). Is there a bias in proteome research? Genome Research, {\bf 11:} 1971--1973. \bibitem[Overbeek et al. 1999]{Overbeek} Overbeek, R., Fonstein, M., D'Souza, M., Pusch, G.D., and Maltsev, N. (1999). The use of gene clusters to infer functional coupling. Proceedings of the National Academy of Sciences USA, {\bf 96:} 2896--2901. \bibitem[Pavlidis et al. 2001]{Pavlidis} Pavlidis, P., and Weston, J. (2001). Gene functional classification from heterogeneous data. In {\it Proceedings of the Fifth International Conference on Computational Molecular Biology (RECOMB2001):} 249--255. \bibitem[Pearson et al. 1988]{FASTA} Pearson, W.R., and Lipman, D.J. (1988). Improved tools for biological sequence comparison. Proceedings of the National Academy of Sciences USA, {\bf 85:} 2444--2448.
%\vfill\eject
\bibitem[Pellegrini et al. 1999]{EisenbergPhylogenetic} Pellegrini, M., Marcotte, E.M., Thompson, M.J., Eisenberg, D., and Yeates, T.O. (1999). Assigning protein functions by comparative genome analysis: protein phylogenetic profiles. Proceedings of the National Academy of Sciences USA, {\bf 96:} 4285--4288. \bibitem[Pilpel et al. 2001]{Pilpel et al. 2001} Pilpel, Y., Sudarsanam, P., and Church, G.M. (2001). Identifying regulatory networks by combinatorial analysis of promoter elements. Nature Genetics, {\bf 29:} 153--159. \bibitem[Saito et al. 2003]{Saito et al. 2003} Saito, R., Suzuki, H., and Hayashizaki, Y. (2003). Construction of reliable protein-protein interaction networks with a new interaction generality measure. Bioinformatics, {\bf 19:} 756--763. \bibitem[Schwikowski et al. 2000]{Schwikowski} Schwikowski, B., Uetz, P., and Fields, S. (2000). A network of protein-protein interactions in yeast. Nature Biotechnology, {\bf 18:} 1257--1261. \bibitem[Stawiski et al. 2002]{StawiskiPSB} Stawiski, E.W., Mandel-Gutfreund, Y., Lowenthal, A.C., and Gregoret, L.M. (2002). 
Progress in Predicting Protein Function from Structure: Unique features of O-Glycosidases. {\it Pacific Symposium on Biocomputing (PSB2002):} 637--648. \bibitem[Sturm 1999]{Sturm} Sturm, J.F. (1999). Using SeDuMi 1.02, a MATLAB toolbox for optimization over symmetric cones. Optimization Methods and Software, {\bf 11--12:} 625--653. \bibitem[Tong et al. 2002]{Tong} Tong, A.H.Y., Drees, B., Nardelli, G., Bader, G.D., Brannetti, B., Castagnoli, L., Evangelista, M., Paoluzi, S., Quondam, M., Zucconi, A., et al. (2002). A combined experimental and computational strategy to define protein interaction networks for peptide recognition modules. Science, {\bf 295:} 321--324. \bibitem[Troyanskaya et al. 2003]{Troyanskaya et al. 2003} Troyanskaya, O.G., Dolinski, K., Owen, A.B., Altman, R.B., and Botstein, D. (2003). A Bayesian framework for combining heterogeneous data sources for gene function prediction (in Saccharomyces cerevisiae). Proceedings of the National Academy of Sciences USA, {\bf 100:} 8348--8353. \bibitem[Tu et al. 2005]{Tu et al. 2005} Tu, Z.D., Lee, H.J., Deng, M.H., Chen, T., and Sun, F.Z. (2005). Understanding Protein Essentiality - Linking Genomic Information with Phenotype. {\it Technical Report.} \bibitem[Uetz et al. 2000]{Uetz2000} Uetz, P., Giot, L., Cagney, G., Mansfield, T.A., Judson, R.S., Knight, J.R., Lockshon, D., Narayan, V., Srinivasan, M., Pochart, P., et al. (2000). A comprehensive analysis of protein-protein interactions in Saccharomyces cerevisiae. Nature, {\bf 403:} 623--627. \bibitem[Vazquez et al. 2003]{Vazquez} Vazquez, A., Flammini, A., Maritan, A., and Vespignani, A. (2003). Global protein function prediction from protein--protein interaction networks. Nature Biotechnology, {\bf 21:} 697--700. \bibitem[Venables et al. 1996]{Splus} Venables, W.N., and Ripley, B.D. (1996). Modern Applied Statistics with S-Plus. Springer-Verlag: New York. \bibitem[Xenarios et al. 
2002]{DIP} Xenarios,~I., Salwinski,~L., Duan,~X.J., Higney,~P., Kim,~S., and Eisenberg, D. (2002). DIP: The Database of Interacting Proteins. A research tool for studying cellular networks of protein interactions. Nucleic Acids Research, {\bf 30:} 303--305. \bibitem[Zheng et al. 2002]{YuZheng} Zheng, Y., Roberts, R.J., and Kasif, S. (2002). Genomic functional annotation using co-evolution profiles of gene clusters. Genome Biology, {\bf 3:} 1--9. \bibitem[Zhou et al. 2002]{ZhouXH} Zhou, X.H., Kao, M., and Wong, W. (2002). Transitive Functional Annotation by Shortest-path Analysis of Gene Expression Data. Proceedings of the National Academy of Sciences USA, {\bf 99:} 12783--12788. \end{thebibliography}