The complexity of the problem is reduced by a set of filters that eliminate potential correpsondences between vertices with different intramolecular distances, different electrostatic potentials, different lipophilic potentials, different principal curvatures on the Connolly surfaces, different harmonic shape images for their neighborhoods on the Connolly surfaces, and different orientations of the aligned harmonic shape images with respect to the line segment between any pair of points. ``The approach was tested on dihydrofolate reductase and thermolysin inhibitors and was shown to recover the correct alignments of the compounds bound in the active sites.''", }

@Article{Kinoshita05,
  author = "K. Kinoshita and H. Nakamura",
  title = "Identification of the ligand binding sites on the molecular surface of proteins",
  journal = "Protein Science",
  volume = "14",
  year = "2005",
  pages = "711--718",
  comment = "This paper contains results of an experiment for comparison of a few binding site surfaces to a large database (almost all binding site surfaces in the PDB) using the method described in [Kinoshita03]. Since partial surfaces are matched, a similarity scoring method is introduced that considers both a normalized score for the match of the geometry and electrostatics (Z-score) and the ``coverage'' of the match (fractions of the surfaces found to be in correspondence). Results are presented for 18 hypothetical proteins.",
}

@Article{Kinoshita04,
  author = "K. Kinoshita and H. Nakamura",
  title = "{eF-site and PDBViewer}: database and viewer for protein functional sites",
  journal = "Bioinformatics",
  year = "2004",
  volume = "20",
  pages = "1329--1330",
  comment = "http://ef-site.hgc.jp/eF-site/",
}

@Article{Kinoshita03,
  author = "K. Kinoshita and H.
Nakamura",
  title = "Identification of protein biochemical functions by similarity search using the molecular surface database {eF-site}",
  journal = "Protein Science",
  volume = "12",
  year = "2003",
  pages = "1589--1595",
  comment = "This paper describes matching of surfaces stored in the eF-site database of binding sites. Each binding site is represented by a mesh with electrostatic potential and the 2 principal curvatures at every vertex. The meshes are matched using association graphs, where the electrostatic potentials and principal curvatures have to match within some threshold, as well as the intramolecular distances. No reduction of the point set is performed (e.g., using critical points). Results are shown for matching examples of two SCOP folds and for predicting the biochemical function of one hypothetical protein.",
}

@Article{Kinoshita02,
  author = "K. Kinoshita and J. Furui and H. Nakamura",
  title = "Identification of Protein Functions from a Molecular Surface Database, {eF}-site",
  year = "2002",
  journal = "J. Struct. Func. Genomics",
  volume = "2",
  number = 1,
  pages = "9--22",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site representations with surfaces and matching with geometric hashing
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Lin94,
  author = "S.L. Lin and R. Nussinov and D. Fischer and H.J. Wolfson",
  title = "Molecular-Surface Representations By Sparse Critical-Points",
  journal = "Proteins-Structure Function and Genetics",
  volume = "18",
  year = "1994",
  pages = "94--101",
  comment = "This paper describes a surface representation consisting of ``a limited number of critical points disposed at key locations over the surface.
These points adequately represent the shape and the important characteristics of the surface, despite the fact that they are modest in number.'' Using this representation, they investigate protein-protein and protein-small molecule docking.",
}

@Article{Rosen98,
  author = "M. Rosen and S.L. Lin and H. Wolfson and R. Nussinov",
  title = "Molecular shape comparisons in searches for active sites and functional similarity",
  journal = "Protein Engineering",
  volume = "11",
  year = "1998",
  pages = "263--277",
  comment = "This paper uses geometric hashing to examine ``the reliability of surface comparisons in searches for active sites in proteins. Specifically, we compare the efficacy of molecular surface comparisons with comparisons of surface atoms and of C(alpha) backbone atoms. We further investigate comparisons of specific atoms, belonging to a predefined pattern of catalytic residues versus comparisons of molecular surfaces and, separately, of surface atoms. We also explore active site comparisons versus comparisons in which the entire molecular surfaces are scanned. While here we focus on the geometrical aspect of the problem, we also investigate the effect of adding residue labels in these comparisons. Our extensive studies cover the serine proteases, containing the highly conserved triad motif, and the chorismate mutases. Our results show that molecular surface comparisons work best when the similarity is high. As the similarity deteriorates, the number of potential solutions increases rapidly, making their ranking difficult, particularly when scanning entire molecular surfaces. Utilizing atomic coordinates directly appears more adequate under such circumstances.''",
}

@Article{Fischer93,
  author = "D. Fischer and R. Norel and H. Wolfson and R.
Nussinov",
  title = "Surface motifs by a computer vision technique: searches, detection, and implications for protein-ligand recognition",
  journal = "Proteins",
  volume = "16",
  year = "1993",
  pages = "278--292",
  comment = "This paper uses geometric hashing to perform ``4 types of comparisons between pairs of molecules: (1) comparison of the backbones of two protein domains; (2) search for a predefined 3-D C alpha motif within the full backbone of a domain; and in particular, (3) comparison of the surfaces of two receptor proteins; and (4) comparison of the surface of a receptor to the surface of a ligand. ... Searches for 3-D surface motifs can be carried out on either receptors or on ligands.''",
}

@Article{Bachar93,
  author = "O. Bachar and D. Fischer and R. Nussinov and H. Wolfson",
  title = "A Computer Vision-Based Technique For {3-D} Sequence-Independent Structural Comparison Of Proteins",
  journal = "Protein Engineering",
  volume = "6",
  year = "1993",
  pages = "279--288",
  comment = "Uses geometric hashing",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site representations with surfaces and matching with genetic algorithms
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Poirrette97,
  author = "A.R. Poirrette and P.J. Artymiuk and D.W. Rice and P. Willett",
  title = "Comparison of protein surfaces using a genetic algorithm",
  journal = "Journal of Computer-Aided Molecular Design",
  volume = "11",
  year = "1997",
  pages = "557--569",
  comment = "``A genetic algorithm (GA) is described which is used to compare the solvent-accessible surfaces of two proteins or fragments of proteins, represented by a dot surface calculated using the Connolly algorithm. The GA is used to move one surface relative to the other to locate the most similar surface region between the two.
The matching process is enhanced by the use of the surface normals and shape terms provided by the Connolly program and also by a simple hydrogen-bonding descriptor and an additional shape descriptor. The algorithm has been tested in applications ranging from the comparison of small surface patches to the comparison of whole protein surfaces. Examples of the matches are given and a quantitative analysis of the quality of the matches is performed.''",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site representations with radial extents and matching with spherical harmonic surfaces
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Kahraman07,
  author = "A. Kahraman and R.J. Morris and R. Laskowski and J.M. Thornton",
  title = "Shape Variation in Protein Binding Pockets and their Ligands",
  journal = "J. Mol. Biol.",
  year = "2007",
  volume = "368",
  pages = "283--301",
  comment = "A common assumption about the shape of protein binding pockets is that they are related to the shape of the small ligand molecules that can bind there. But to what extent is that assumption true? Here we use a recently developed shape matching method to compare the shapes of protein binding pockets to the shapes of their ligands. We find that pockets binding the same ligand show greater variation in their shapes than can be accounted for by the conformational variability of the ligand. This suggests that geometrical complementarity in general is not sufficient to drive molecular recognition. Nevertheless, we show when considering only shape and size that a significant proportion of the recognition power of a binding pocket for its ligand resides in its shape.
Additionally, we observe a buffer zone or a region of free space between the ligand and protein, which results in binding pockets being on average three times larger than the ligand that they bind.",
}

@Article{Morris05a,
  author = "R.J. Morris and R.J. Najmanovich and A. Kahraman and J.M. Thornton",
  title = "Real spherical harmonic expansion coefficients as {3D} shape descriptors for protein binding pocket and ligand comparisons",
  journal = "Bioinformatics",
  volume = "21",
  number = "10",
  year = "2005",
  pages = "2347--2355",
  comment = "This paper ``uses the coefficients of a real spherical harmonics expansion to describe the shape of a protein's binding pocket.'' Binding sites are represented by the radial extent of surfnet spheres within 3.5 angstroms of a conserved residue. The resulting spherical functions are aligned with PCA, only the highest order spherical harmonic coefficients are retained, and shape similarity is computed as the L2 distance between corresponding spherical harmonic coefficients.",
}

@InProceedings{Morris05b,
  author = "R.J. Morris and A. Kahraman and T. Funkhouser and R. Najmanovich and G. Stockwell and F. Glaser and R. Laskowski and J.M. Thornton",
  title = "Binding Pocket Shape Analysis for Protein Function Prediction",
  booktitle = "{LASR} Workshop on Quantitative Biology, Shape Analysis, and Wavelets",
  location = "Leeds England",
  month = jun,
  year = "2005",
}

@Article{Cai02,
  author = "W. Cai and X. Shao and B. Maigret",
  title = "Protein-ligand recognition using spherical harmonic molecular surfaces: towards a fast and efficient filter for large virtual throughput screening",
  journal = "Journal of Molecular Graphics and Modeling",
  volume = "20",
  pages = "313--328",
  year = "2002",
  comment = "``In this paper, we present an extension of our work to spherical harmonic surfaces in order to approximate molecular surfaces of both ligands and receptor-cavities and to easily check the surface-shape complementarity.
The method consists of (1) finding lobes and holes on both ligand and cavity surfaces using contour maps of radius functions with spherical harmonic expansions, (2) superposing the surfaces around a given binding site by minimizing the distance between their respective expansion coefficients. This docking procedure capabilities was demonstrated by application to 35 protein-ligand complexes of known crystal structures.''",
}

@Article{Cai98,
  author = "W. Cai and M. Zhang and B. Maigret",
  title = "New approach for representation of molecular surface",
  journal = "J. Comput. Chem",
  volume = "19",
  year = "1998",
  pages = "1805--1815",
}

@Article{Ritchie99,
  author = "D.W. Ritchie and G.J.L. Kemp",
  title = "Fast computation, rotation, and comparison of low resolution spherical harmonic molecular surfaces",
  journal = "J. Comput. Chem",
  volume = "20",
  year = "1999",
  pages = "383--395",
  comment = "Describes Fourier search algorithm for optimal rotational alignment",
}

@Article{Duncan93a,
  author = "B.S. Duncan and A.J. Olson",
  title = "Shape analysis of molecular surfaces",
  journal = "Biopolymers",
  volume = "33",
  year = "1993",
  pages = "231--238",
}

@Article{Duncan93b,
  author = "B.S. Duncan and A.J. Olson",
  title = "Approximation and characterization of molecular surfaces",
  journal = "Biopolymers",
  volume = "33",
  year = "1993",
  pages = "219--229",
}

@Article{Leicester88,
  author = "S. Leicester and J.L. Finney and R.P. Bywater",
  title = "Description of molecular surface shape using {F}ourier descriptors",
  journal = "J. Mol. Graph",
  volume = "6",
  year = "1988",
  pages = "104--108",
}

@Article{Max88,
  author = "N.L. Max and E.D. Getzoff",
  title = "Spherical harmonic molecular surfaces",
  journal = "IEEE Comput. Graph.
Appl",
  volume = "8",
  year = "1988",
  pages = "42--50",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site representations and matching with other methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Goldman00,
  author = "B.B. Goldman and W.T. Wipke",
  title = "{Quadratic Shape Descriptors} 1. Rapid Superposition of Dissimilar Molecules Using Geometrically Invariant Surface Descriptors",
  journal = "J. Chem. Inf. Model.",
  volume = "40",
  number = "3",
  year = "2000",
  pages = "644--658",
}

@InProceedings{Funkhouser05b,
  author = "T. Funkhouser and F. Glaser and R. Laskowski and R. Morris and R. Najmanovich and G. Stockwell and J. Thornton",
  title = "Shape-Based Classification of Bound Ligands",
  booktitle = "{LASR} Workshop on Quantitative Biology, Shape Analysis, and Wavelets",
  location = "Leeds England",
  month = jun,
  year = "2005",
}

@Article{Exner02a,
  author = "T.E. Exner and M. Keil and J. Brickmann",
  title = "Pattern recognition strategies for molecular surfaces. {I.} Pattern generation using fuzzy set theory",
  journal = "Journal of Computational Chemistry",
  volume = "23",
  year = "2002",
  pages = "1176--1187",
}

@Article{Exner02b,
  author = "T.E. Exner and M. Keil and J. Brickmann",
  title = "Pattern recognition strategies for molecular surfaces. {II.} Surface complementarity",
  journal = "Journal of Computational Chemistry",
  volume = "23",
  year = "2002",
  pages = "1188--1197",
  comment = "``Fuzzy logic based algorithms for the quantitative treatment of complementarity of molecular surfaces are presented. ... The algorithms are applied to 33 biomolecular complexes. ... After the optimization with a downhill simplex method, for all these complexes one structure was found, which is in very good agreement with the experimental results.''",
}

@InProceedings{Gu03,
  author = "X.
Gu and {S.-T.} Yau",
  title = "Surface Classification Using Conformal Structures",
  booktitle = "Ninth {IEEE} International Conference on Computer Vision ({ICCV'03})",
  volume = "1",
  year = "2003",
  pages = "701",
  comment = "This paper provides a way to map a surface from 3D to 2D (flatten it) while retaining the angles between edges of the mesh as best as possible (a conformal map). The surfaces are compared/classified in the 2D domain.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site representations with alpha-shapes
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Liang98a,
  author = "J. Liang and H. Edelsbrunner and P. Fu and P.V. Sudhakar and S. Subramaniam",
  year = "1998",
  title = "Analytical shape computing of macromolecules I: molecular area and volume through alpha shape",
  journal = "Proteins",
  volume = "33",
  pages = "1--17",
}

@Article{Liang98b,
  author = "J. Liang and H. Edelsbrunner and P. Fu and P.V. Sudhakar and S. Subramaniam",
  title = "Analytical shape computing of macromolecules II: identification and computation of inaccessible cavities inside proteins",
  journal = "Proteins",
  volume = "33",
  year = "1998",
  pages = "18--29",
}

@Article{Liang98c,
  author = "J. Liang and H. Edelsbrunner and C. Woodward",
  year = "1998",
  title = "Anatomy of protein pockets and cavities: Measurement of binding site geometry and implications for ligand design",
  journal = "Protein Science",
  volume = "7",
  pages = "1884--1897",
}

@Article{Edelsbrunner98,
  author = "H. Edelsbrunner and M. Facello and J. Liang",
  title = "On the definition and the construction of pockets in macromolecules",
  journal = "Disc. Appl. Math",
  volume = "88",
  pages = "83--102",
  year = "1998",
}

@InProceedings{Edelsbrunner95,
  author = "H. Edelsbrunner and M. Facello and P. Fu and J.
Liang",
  title = "Measuring Proteins and Voids in Proteins",
  booktitle = "Proceedings of the 28th Annual Hawaii International Conference on Systems Science",
  year = "1995",
  pages = "256--264",
}

@Article{Binkowski03b,
  author = "T.A. Binkowski and S. Naghibzadeh and J. Liang",
  title = "{CASTp:} {C}omputed {A}tlas of {S}urface {T}opography of {p}roteins",
  journal = "Nucleic Acids Res",
  year = "2003",
  volume = "31",
  pages = "3352--3355",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site representation with grids and matching with correlation
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Katchalski-Katzir92,
  author = "E. Katchalski-Katzir and I. Shariv and M. Eisenstein and A.A. Friesem and C. Aflalo and I.A. Vakser",
  title = "Molecular surface recognition: determination of geometric fit between proteins and their ligands by correlation techniques",
  journal = "Proc. Natl. Acad. Sci. U.S.A",
  volume = "89",
  year = "1992",
  pages = "2195--2199",
  comment = "Rasterizes molecules into grid. Discretely samples rotations. Uses correlation in Fourier domain to search for best translation.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Representation of binding sites with flexible structures
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Pitman01,
  title = "{FLASHFLOOD:} A {3D} field-based similarity search and alignment method for flexible molecules",
  author = "M.C. Pitman and W.K. Huber and H. Horn and A. Kramer and J.E. Rice and W.C. Swope",
  journal = "J Comput Aided Mol Des",
  year = "2001",
  month = jul,
  volume = "15",
  number = "7",
  pages = "587--612",
  comment = "This is Wolfgang's paper",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site mapping with probes
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Goodford85,
  author = "P.J.
Goodford",
  title = "A computational procedure for determining energetically favorable binding sites on biologically important macromolecules",
  journal = "J. Med. Chem.",
  volume = "28",
  year = "1985",
  pages = "849--857",
  comment = "Uses GRID",
}

@Article{Kastenholz00,
  author = "M.A. Kastenholz and M. Pastor and G. Cruciani and E.E. Haaksma and T. Fox",
  title = "{GRID/CPCA:} a new computational tool to design selective ligands",
  journal = "J Med Chem",
  volume = "43",
  year = "2000",
  pages = "3033--3044",
  comment = "Uses GRID to understand similarities/differences between binding sites",
}

@Article{Reynolds89,
  author = "C.A. Reynolds and R.C. Wade and P.J. Goodford",
  title = "Identifying targets for bioreductive agents: using {GRID} to predict selective binding regions of proteins",
  journal = "J Mol Graph.",
  volume = "7",
  number = "2",
  month = jun,
  year = "1989",
  pages = "103--108",
}

@Article{Ruppert97,
  author = "J. Ruppert and W. Welch and A. Jain",
  title = "Automatic identification and representation of protein binding sites for molecular docking",
  journal = "Protein Science",
  volume = "6",
  year = "1997",
  pages = "524--533",
  comment = "This paper presents an algorithm for representing a protein's binding site in a way that is specifically suited to molecular docking applications. Initially the protein's surface is coated with a collection of molecular fragments that could potentially interact with the protein. Each fragment, or probe, serves as a potential alignment point for atoms in a ligand, and is scored to represent that probe's affinity for the protein. Probes are then clustered by accumulating their affinities, where high affinity clusters are identified as being the ``stickiest'' portions of the protein surface. The stickiest cluster is used as a computational binding ``pocket'' for docking.",
}

@Article{Pastor97,
  author = "Manuel Pastor and Gabriele Cruciani and Kimberly A.
Watson",
  title = "A Strategy for the Incorporation of Water Molecules Present in a Ligand Binding Site into a Three-Dimensional Quantitative Structure-Activity Relationship Analysis",
  journal = "J. Med. Chem",
  year = "1997",
  volume = "40",
  number = "25",
  pages = "4089--4102",
  comment = "Uses GRID descriptors input in statistical procedures like CoMFA, GOLPE or SIMCA for QSAR or 3D-QSAR analyses",
}

@Misc{GRID,
  author = {{Molecular Discovery}},
  title = "{GRID}",
  howpublished = {http://www.moldiscovery.com/soft\_grid.php},
  year = "2005",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site mapping with probe/fragment docking/simulation
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Mattos96,
  author = "Carla Mattos and Dagmar Ringe",
  title = "Locating and characterizing binding sites on proteins",
  journal = "Nature Biotechnology",
  volume = "14",
  year = "1996",
  pages = "595--599",
  comment = "``This review article begins with a discussion of fundamental differences between substrates and inhibitors, and some of the assumptions and goals underlying the design of a new ligand to a target protein. An overview is given of the methods currently used to locate and characterize ligand binding sites on protein surfaces, with focus on a novel approach: multiple solvent crystal structures (MSCS). In this method, the X-ray crystal structure of the target protein is solved in a variety of organic solvents. Each type of solvent molecule serves as a probe for complementary binding sites on the protein. The probe distribution on the protein surface allows the location of binding sites and the characterization of the potential ligand interactions within these sites.
General aspects of the application of the MSCS method to porcine pancreatic elastase is discussed, and comparison of the results with those from X-ray crystal structures of elastase/inhibitor complexes is used to illustrate the potential of the method in aiding the process of rational drug design.''",
}

@Article{Miranker91,
  author = "A. Miranker and M. Karplus",
  title = "Functionality maps of binding sites: a multiple copy simultaneous search method",
  journal = "Proteins",
  volume = "11",
  year = "1991",
  pages = "29--34",
  comment = "This is the main reference for the multiple copy simultaneous search (MCSS) method. ``A new method is proposed for determining energetically favorable positions and orientations for functional groups on the surface of proteins with known three-dimensional structure. From 1,000 to 5,000 copies of a functional group are randomly placed in the site and subjected to simultaneous energy minimization and/or quenched molecular dynamics. The resulting functionality maps of a protein receptor site, which can take account of its flexibility, can be used for the analysis of protein ligand interactions and rational drug design. Application of the method to the sialic acid binding site of the influenza coat protein, hemagglutinin, yields functional group minima that correspond with those of the ligand in a cocrystal structure.''",
}

@Article{Stultz99,
  author = "C.M. Stultz and Martin Karplus",
  title = "{MCSS} Functionality Maps for a Flexible Protein",
  journal = "Proteins, Structure Function and Genetics",
  volume = "37",
  year = "1999",
  pages = "512--529",
}

@Book{Evensen97,
  author = "E. Evensen and D. {Joseph-McCarthy} and M. Karplus",
  title = "{MCSS} version 2.1",
  publisher = "Harvard University",
  location = "Cambridge, MA USA",
  year = "1997",
}

@Article{Caflisch93,
  author = "A. Caflisch and A. Miranker and M.
Karplus",
  title = "Multiple copy simultaneous search and construction of ligands in binding sites: application to inhibitors of {HIV-1} aspartic proteinase",
  journal = "J. Med. Chem.",
  volume = "36",
  pages = "2142--2167",
  year = "1993",
}

@Article{Dennis02,
  author = "Sheldon Dennis and Tamas Kortvelyesi and Sandor Vajda",
  title = "Computational mapping identifies the binding sites of organic solvents on proteins",
  journal = "PNAS",
  month = apr,
  year = "2002",
  volume = "99",
  number = "7",
  pages = "4290--4295",
  abstract = "Computational mapping places molecular probes---small molecules or functional groups---on a protein surface to identify the most favorable binding positions. Although x-ray crystallography and NMR show that organic solvents bind to a limited number of sites on a protein, current mapping methods result in hundreds of energy minima and do not reveal why some sites bind molecules with different sizes and polarities. We describe a mapping algorithm that explains the origin of this phenomenon. The algorithm has been applied to hen egg-white lysozyme and to thermolysin, interacting with eight and four different ligands, respectively. In both cases the search finds the consensus site to which all molecules bind, whereas other positions that bind only certain ligands are not necessarily found. The consensus sites are pockets of the active site, lined with partially exposed hydrophobic residues and with a number of polar residues toward the edge. These sites can accommodate each ligand in a number of rotational states, some with a hydrogen bond to one of the nearby donor/acceptor groups.
Specific substrates and/or inhibitors of hen egg-white lysozyme and thermolysin interact with the same side chains identified by the mapping, but form several hydrogen bonds and bind in unique orientations.",
}

@Article{Silberstein03,
  author = "Michael Silberstein and Sheldon Dennis and Lawrence {Brown III} and Tamas Kortvelyesi and Karl Clodfelter and Sandor Vajda",
  title = "Identification of Substrate Binding Sites in Enzymes by Computational Solvent Mapping",
  journal = "J. Mol. Biol.",
  volume = "332",
  year = "2003",
  pages = "1095--1113",
  comment = "Docks many small molecule fragments and then predicts that active residues are the ones closest to the docked positions of the fragments",
}

@Article{Kortvelyesi03,
  author = "T. Kortvelyesi and M. Silberstein and S. Dennis and S. Vajda",
  title = "Improved mapping of protein binding sites",
  journal = "J Comput Aided Mol Des",
  volume = "17",
  year = "2003",
  pages = "173--186",
}

@Article{Bliznyuk99,
  author = "A. Bliznyuk and J. Gready",
  title = "Simple method for locating possible ligand binding sites on protein surfaces",
  journal = "J. Comput. Chem.",
  volume = "20",
  number = "9",
  year = "1999",
  pages = "983--988",
  comment = "Uses FFT to dock rigid ligand using a simple shape correlation function in order to find the correct binding site, which will later be analyzed by more detailed (energetic) docking methods.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site mapping with knowledge-based algorithms
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Evers03,
  author = "A. Evers and H. Gohlke and G. Klebe",
  title = "Ligand-supported Homology Modelling of Protein Binding-sites using Knowledge-based Potentials",
  journal = "J. Mol. Biol.",
  year = "2003",
  volume = "334",
  pages = "327--345",
  abstract = "A new approach, MOBILE, is presented that models protein binding-sites including bound ligand molecules as restraints.
Initially generated, homology models of the target protein are refined iteratively by including information about bioactive ligands as spatial restraints and optimising the mutual interactions between the ligands and the binding-sites. Thus optimised models can be used for structure-based drug design and virtual screening. In a first step, ligands are docked into an averaged ensemble of crude homology models of the target protein. In the next step, improved homology models are generated, considering explicitly the previously placed ligands by defining restraints between protein and ligand atoms. These restraints are expressed in terms of knowledge-based distance-dependent pair potentials, which were compiled from crystallographically determined protein-ligand complexes. Subsequently, the most favourable models are selected by ranking the interactions between the ligands and the generated pockets using these potentials. Final models are obtained by selecting the best-ranked side-chain conformers from various models, followed by an energy optimisation of the entire complex using a common force-field. Application of the knowledge-based pair potentials proved efficient to restrain the homology modelling process and to score and optimise the modelled protein-ligand complexes. For a test set of 46 protein-ligand complexes, taken from the Protein Data Bank (PDB), the success rate of producing near-native binding-site geometries (rmsd $<$ 2.0 {\AA}) with MODELLER is 70\% when the ligand restrains the homology modelling process in its native orientation. Scoring these complexes with the knowledge-based potentials, in 66\% of the cases a pose with rmsd $<$ 2.0 {\AA} is found on rank 1. Finally, MOBILE has been applied to two case studies modelling factor Xa based on trypsin and aldose reductase based on aldehyde reductase.",
}

@Article{Sotriffer02a,
  author = "C. Sotriffer and G.
Klebe",
  title = "Identification and mapping of small-molecule binding sites in proteins: computational tools for structure-based drug design",
  journal = "Farmaco",
  volume = "57",
  year = "2002",
  pages = "243--251",
}

@Article{Verdonk01,
  author = "M.L. Verdonk and J.C. Cole and P. Watson and V. Gillet and P. Willett",
  title = "Superstar: improved knowledge-based interaction fields for protein binding sites",
  journal = "Journal of Molecular Biology",
  volume = "307",
  number = "3",
  month = mar,
  year = "2001",
  pages = "841--859",
}

@Article{Laskowski96,
  author = "R.A. Laskowski and J.M. Thornton and C. Humblet and J. Singh",
  title = "{X-SITE:} use of empirically derived atomic packing preferences to identify favourable interaction regions in the binding sites of proteins",
  journal = "J. Mol. Biol",
  volume = "259",
  pages = "175--201",
  year = "1996",
  comment = "This is the main reference for XSITE",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand binding site representations with strings
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Karlin96,
  author = "S. Karlin and Z.Y. Zhu",
  title = "Characterizations of diverse residue clusters in protein three-dimensional structures",
  journal = "Proc Natl Acad Sci U S A",
  volume = "93",
  year = "1996",
  pages = "8344--8349",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking overviews
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Halperin02,
  author = "I. Halperin and B. Ma and Haim Wolfson and Ruth Nussinov",
  title = "Principles of Docking: An Overview of Search Algorithms and a Guide to Scoring Functions",
  journal = "Proteins: Structure, Function, and Genetics",
  volume = "47",
  pages = "409--443",
  year = "2002",
}

@Article{Taylor02b,
  author = "R.D. Taylor and P.J. Jewsbury and J.W.
Essex",
  title = "A review of protein-small molecule docking methods",
  journal = "Journal of Computer-Aided Molecular Design",
  volume = "16",
  pages = "151--166",
  year = "2002",
}

@Article{Krovat05,
  author = "E.M. Krovat and T. Steindl and T. Langer",
  title = "Recent Advances in Docking and Scoring",
  journal = "Current Computer-Aided Drug Design",
  volume = "1",
  number = "1",
  year = "2005",
  pages = "93--102",
  abstract = "This review is focused on recent advances and new aspects in the field of molecular docking and scoring, and it covers multiple applications and case studies. Basic requirements and different algorithms for docking are briefly discussed. Moreover, parameters that influence docking results, combination of different docking algorithms and scoring functions, performance of scoring functions, docking using homology models, and ligand and protein flexibility are examined to give an overview of the state-of-the-art methods and a survey of innovative approaches in molecular docking and scoring. Regarding the enormous amount of literature in this field we restrict ourselves on an overview of several important advances in docking and scoring techniques published within the last two years, i.e. we considered publications ranging from 2002 to 2004.",
}

@Article{Brooijmans03,
  author = "N. Brooijmans and I.D. Kuntz",
  title = "Molecular recognition and docking algorithms",
  journal = "Annu Rev Biophys Biomol Struct",
  volume = "32",
  year = "2003",
  pages = "335--373",
  abstract = "Molecular docking is an invaluable tool in modern drug discovery. This review focuses on methodological developments relevant to the field of molecular docking. The forces important in molecular recognition are reviewed and followed by a discussion of how different scoring functions account for these forces. More recent applications of computational chemistry tools involve library design and database screening.
Last, we summarize several critical methodological issues that must be addressed in future developments.",
}

@Article{Kroemer03,
  author = "R.T. Kroemer",
  title = "Molecular modelling probes: docking and scoring",
  journal = "Biochemical Society Transactions",
  year = "2003",
  volume = "31",
  number = "5",
  pages = "980-984",
  abstract = "A general introduction to molecular modelling techniques in the area of protein-ligand interactions is given. Methods covered range from binding-site analysis to statistical treatment of sets of ligands. The main focus of this paper is on docking and scoring. After an outline of the main concepts, two specific application examples are given.",
}

@Article{Kitchen04,
  author = "D.B. Kitchen and H. Decornez and J.R. Furr and J.D.B. Bajorath",
  title = "Docking and scoring in virtual screening for drug discovery: methods and applications",
  journal = "Nature Rev. Drug Discov.",
  volume = "3",
  number = "11",
  pages = "935-949",
  year = "2004",
  abstract = "Computational approaches that 'dock' small molecules into the structures of macromolecular targets and 'score' their potential complementarity to binding sites are widely used in hit identification and lead optimization. Indeed, there are now a number of drugs whose development was heavily influenced by or based on structure-based design and screening strategies, such as HIV protease inhibitors. Nevertheless, there remain significant challenges in the application of these approaches, in particular in relation to current scoring schemes.
Here, we review key concepts and specific features of small-molecule-protein docking methods, highlight selected applications and discuss recent advances that aim to address the acknowledged limitations of established approaches.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking with Monte Carlo simulated annealing
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Friesner04,
  author = "R.A. Friesner and J.L. Banks and R.B. Murphy and T.A. Halgren and J.J. Klicic and D.T. Mainz and M.P. Repasky and E.H. Knoll and M. Shelley and J.K. Perry and D.E. Shaw and P. Francis and P.S. Shenkin",
  title = "Glide: A New Approach for Rapid, Accurate Docking and Scoring. 1. {Method} and Assessment of Docking Accuracy",
  journal = "J. Med. Chem.",
  year = "2004",
  volume = "47",
  pages = "1739-1749",
  comment = "This is the main reference for GLIDE",
}

@Article{Liu99,
  author = "M. Liu and S. Wang",
  title = "{MCDOCK:} A {Monte Carlo} simulation approach to the molecular docking problem",
  journal = "Journal of Computer-Aided Molecular Design",
  volume = "13",
  number = "5",
  year = "1999",
  pages = "435-451",
  comment = "This is the main reference for MCDock.",
}

@Article{Goodsell90,
  author = "D.S. Goodsell and A.J. Olson",
  title = "Automated Docking of Substrates to Proteins by Simulated Annealing",
  journal = "Proteins: Str. Func. and Genet.",
  volume = "8",
  year = "1990",
  pages = "195-202",
  comment = "This is the main reference for AutoDock 1.0.",
}

@Article{Mcmartin97,
  author = "C. Mcmartin and R.S.
Bohacek",
  title = "{QXP:} Powerful, rapid computer algorithms for structure-based drug design",
  journal = "Journal of Computer-Aided Molecular Design",
  volume = "11",
  number = "4",
  year = "1997",
  pages = "333-344",
  comment = "This is the main reference for QXP.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking with genetic algorithms
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Jones97,
  author = "G. Jones and P. Willett and R.C. Glen and A.R. Leach and R. Taylor",
  title = "Development and Validation of a Genetic Algorithm for Flexible Docking",
  journal = "J. Mol. Biol.",
  volume = "267",
  year = "1997",
  pages = "727-748",
  comment = "This is the main reference for GOLD.",
}

@Article{Verdonk03,
  author = "M.L. Verdonk and J.C. Cole and M.J. Hartshorn and C.W. Murray and R. D. Taylor",
  title = "Improved Protein-Ligand Docking Using {GOLD}",
  journal = "Proteins",
  volume = "52",
  year = "2003",
  pages = "609-623",
  comment = "This is a more recent paper about GOLD.",
}

@Article{Morris98,
  author = "G.M. Morris and D.S. Goodsell and R.S. Halliday and R. Huey and W.E. Hart and R.K. Belew and A.J. Olson",
  title = "Automated Docking Using a {Lamarckian} Genetic Algorithm and an Empirical Binding Free Energy Function",
  journal = "J. Computational Chemistry",
  volume = "19",
  year = "1998",
  pages = "1639-1662",
  comment = "This is the main reference for AutoDock 3.0 (http://www.scripps.edu/mb/olson/dock/autodock/).",
}

@Article{Oshiro95,
  author = "C.M. Oshiro and I.D. Kuntz",
  title = "Flexible ligand docking using a genetic algorithm",
  journal = "J. Comput-Aided Mol. Design",
  volume = "9",
  pages = "113-130",
  year = "1995",
  comment = "DOCK",
}

@Article{Yang04,
  author = "J.M. Yang and C.C.
Chen",
  title = "{GEMDOCK:} A generic evolutionary method for molecular docking",
  journal = "Proteins: Structure, Function, and Bioinformatics",
  volume = "55",
  year = "2004",
  pages = "288-304",
  comment = "This is the main reference for GemDock.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking with incremental construction
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Rarey96,
  author = "M. Rarey and B. Kramer and T. Lengauer and G. Klebe",
  year = "1996",
  title = "A Fast Flexible Docking Method using an Incremental Construction Algorithm",
  journal = "Journal of Molecular Biology",
  volume = "261",
  number = "3",
  pages = "470-489",
  comment = "This is the main reference for FlexX (http://www.biosolveit.de/FlexX/).",
}

@Article{Zavodsky02,
  author = "M.I. Zavodszky and P.C. Sanschagrin and R.S. Korde and L.A. Kuhn",
  title = "Distilling the essential features of a protein surface for improving protein-ligand docking, scoring, and virtual screening",
  journal = "J. Comput. Aided Mol. Des.",
  volume = "16",
  year = "2002",
  pages = "883-902",
  comment = "This is the main reference for SLIDE.",
}

@Article{Jain03,
  author = "A.N.
Jain",
  title = "Surflex: fully automatic flexible molecular docking using a molecular similarity-based search engine",
  journal = "J Med Chem",
  volume = "46",
  year = "2003",
  pages = "499-511",
  comment = "This is the main reference for Surflex.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking with systematic search
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Misc{FRED,
  author = "{Open Eye Scientific Software}",
  title = "{FRED:} Fast Rigid Exhaustive Docking",
  howpublished = "http://www.eyesopen.com/docs/html/fred/",
  year = "2005",
  comment = "This is the main reference for FRED, which docks ligands in proteins using precomputed ligand conformations and systematic search over translations and rotations.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking with tabu search methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Baxter97,
  author = "C.A. Baxter and C.W. Murray and D.E. Clark and D.R. Westhead and M.D. Eldridge",
  title = "Flexible docking using {TABU} search and an empirical estimate of binding affinity",
  journal = "Proteins",
  volume = "33",
  year = "1997",
  pages = "367-382",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking with multiconformers
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{McGann03,
  author = "M. McGann and H. Almond and A. Nicholls and J.A. Grant and F. Brown",
  title = "{Gaussian} Docking Functions",
  journal = "Biopolymers",
  volume = "68",
  year = "2003",
  pages = "76-90",
  comment = "FRED",
}

@InProceedings{Choi05,
  author = "V.
Choi",
  title = "Yucca: An Efficient Algorithm for Small Molecule Docking",
  booktitle = "Algorithms in Molecular Biology ({AlgBio2005})",
  year = "2005",
  note = "to appear",
  comment = "This is the main reference for Yucca.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking by consensus
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Paul02,
  author = "N. Paul and D. Rognan",
  title = "{ConsDock:} A new program for the consensus analysis of protein-ligand interactions",
  journal = "Proteins",
  volume = "47",
  number = "4",
  year = "2002",
  pages = "521-533",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking with ...
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Kuntz82,
  author = "I.D. Kuntz and J.M. Blaney and S.J. Oatley and R. Langridge and T.E. Ferrin",
  title = "A geometric approach to macromolecule-ligand interactions",
  journal = "J. Mol. Biol.",
  volume = "161",
  year = "1982",
  pages = "269-288",
  comment = "This is the main reference for the first docking program (Dock 1.0).",
}

@Article{Jackson02,
  author = "R.M. Jackson",
  title = "{Q-fit:} a probabilistic method for docking molecular fragments by sampling low energy conformational space",
  journal = "J Comput Aided Mol Des",
  volume = "16",
  pages = "43-57",
  year = "2002",
}

@Article{Welch96,
  author = "W. Welch and J. Ruppert and A.N. Jain",
  title = "Hammerhead: fast, fully automated docking of flexible ligands to protein binding sites",
  journal = "Chemistry \& Biology",
  volume = "3",
  number = "6",
  year = "1996",
  pages = "449-462",
  comment = "This is the main reference for Hammerhead.",
  abstract = "Background: Molecular docking seeks to predict the geometry and affinity of the binding of a small molecule to a given protein of known structure.
Rigid docking has long been used to screen databases of small molecules, because docking techniques that account for ligand flexibility have either been too slow or have required significant human intervention. Here we describe a docking algorithm, Hammerhead, which is a fast, automated tool to screen for the binding of flexible molecules to protein binding sites. Results: We used Hammerhead to successfully dock a variety of positive control ligands into their cognate proteins. The empirically tuned scoring function of the algorithm predicted binding affinities within 1.3 log units of the known affinities for these ligands. Conformations and alignments close to those determined crystallographically received the highest scores. We screened 80 000 compounds for binding to streptavidin, and biotin was predicted as the top-scoring ligand, with other known ligands included among the highest-scoring dockings. The screen ran in a few days on commonly available hardware. Conclusions: Hammerhead is suitable for screening large databases of flexible molecules for binding to a protein of known structure. It correctly docks a variety of known flexible ligands, and it spends an average of only a few seconds on each compound during a screen. The approach is completely automated, from the elucidation of protein binding sites, through the docking of molecules, to the final selection of compounds for assay.",
}

@Article{Abagyan94,
  author = "R. Abagyan and M. Totrov and D. Kuznetsov",
  title = "{ICM} - A new method for protein modeling and design: Applications to docking and structure prediction from the distorted native conformation",
  journal = "Journal of Computational Chemistry",
  volume = "15",
  number = "5",
  year = "1994",
  pages = "488-506",
  comment = "This is the main reference for ICM",
}

@Article{Schoichet92,
  author = "B.K. Shoichet and D.L. Bodian and I.D. Kuntz",
  title = "Molecular docking using shape descriptors",
  journal = "J. Comp.
Chem.",
  volume = "13",
  number = "3",
  year = "1992",
  pages = "380-397",
  comment = "DOCK",
}

@Article{Meng92,
  author = "E.C. Meng and B.K. Shoichet and I.D. Kuntz",
  title = "Automated docking with grid-based energy evaluation",
  journal = "J. Comp. Chem.",
  volume = "13",
  year = "1992",
  pages = "505-524",
  comment = "DOCK (http://www.cmpharm.ucsf.edu/kuntz/dockinfo.html)",
}

@Article{Meng93,
  author = "E.C. Meng and D.A. Gschwend and J.M. Blaney and I.D. Kuntz",
  title = "Orientational sampling and rigid-body minimization in molecular docking",
  journal = "Proteins",
  volume = "17",
  number = "3",
  pages = "266-278",
  year = "1993",
  comment = "DOCK",
}

@Article{Gschwend96,
  author = "D.A. Gschwend and I.D. Kuntz",
  title = "Orientational sampling and rigid-body minimization in molecular docking, revisited: On-the-fly optimization and degeneracy removal",
  journal = "J. Comput-Aided Mol. Design",
  volume = "10",
  year = "1996",
  pages = "123-132",
  comment = "DOCK",
}

@Article{Shoichet93,
  author = "B.K. Shoichet and I.D. Kuntz",
  title = "Matching chemistry and shape in molecular docking",
  journal = "Protein Engineering",
  volume = "6",
  year = "1993",
  pages = "223-232",
  comment = "DOCK",
}

@Article{Ewing01,
  author = "T.J.A. Ewing and S. Makino and A.G. Skillman and I.D. Kuntz",
  title = "{Dock 4.0:} Search strategies for automated molecular docking of flexible molecule databases",
  journal = "J. Comp. Aided Mol. Design",
  volume = "15",
  year = "2001",
  pages = "411-428",
  comment = "This is the main reference for Dock 4.0.",
}

@Article{Roche01,
  author = "O. Roche and R. Kiyama and C.L. {Brooks, III}",
  title = "Ligand-protein database: Linking protein-ligand complex structures to binding data",
  journal = "J. Med. Chem.",
  volume = "44",
  year = "2001",
  pages = "3592-3598",
}

% NOTE(review): the title, volume, number and pages of Marai04 look like those
% of Carlson and McCammon, Mol Pharmacol 57(2):213-218 (2000); the author and
% year recorded below should be confirmed against the source.
@Article{Marai04,
  author = "C. Marai",
  title = "Accommodating Protein Flexibility in Computational Drug Design",
  journal = "Mol Pharmacol",
  volume = "57",
  number = "2",
  year = "2004",
  pages = "213-218",
}

@Article{Meiler06,
  author = "J. Meiler and D.
Baker",
  year = "2006",
  title = "{ROSETTALIGAND:} Protein-small molecule docking with full side-chain flexibility",
  journal = "Proteins",
  volume = "(Electronic)",
  pages = "1097-0134",
}
% NOTE(review): in Meiler06 above, volume "(Electronic)" and pages "1097-0134"
% look like an electronic-publication marker and the journal ISSN rather than a
% real volume and page range; replace with the published volume/pages once
% confirmed.

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand docking evaluations
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Kellenberger04,
  author = "E. Kellenberger and J. Rodrigo and P. Muller and D. Rognan",
  title = "Comparative evaluation of eight docking tools for docking and virtual screening accuracy",
  journal = "Proteins",
  volume = "57",
  number = "2",
  year = "2004",
  pages = "225-242",
}

@Article{Kontoyianni04a,
  author = "M. Kontoyianni and L.M. McClellan and others",
  title = "Evaluation of Docking Performance: Comparative Data on Docking Algorithms",
  journal = "J Med Chem",
  volume = "47",
  number = "3",
  year = "2004",
  pages = "558-565",
  abstract = "Docking molecules into their respective 3D macromolecular targets is a widely used method for lead optimization. However, the best known docking algorithms often fail to position the ligand in an orientation close to the experimental binding mode. It was reported recently that consensus scoring enhances the hit rates in a virtual screening experiment. This methodology focused on the top-ranked pose, with the underlying assumption that the orientation/conformation of the docked compound is the most accurate. In an effort to eliminate the scoring function bias, and assess the ability of the docking algorithms to provide solutions similar to the crystallographic modes, we investigated the most known docking programs and evaluated all of the resultant poses. We present the results of an extensive computational study in which five docking programs (FlexX, DOCK, GOLD, LigandFit, Glide) were investigated against 14 protein families (69 targets).
Our findings show that some algorithms perform consistently better than others, and a correspondence between the nature of the active site and the best docking algorithm can be found.",
}

@Article{Kontoyianni04b,
  author = "M. Kontoyianni and G.S. Sokol and L.M. McClellan",
  title = "Evaluation of library ranking efficacy in virtual screening",
  journal = "Journal of Computational Chemistry",
  volume = "26",
  number = "1",
  year = "2004",
  pages = "11-22",
  abstract = "We present the results of a comprehensive study in which we explored how the docking procedure affects the performance of a virtual screening approach. We used four docking engines and applied 10 scoring functions to the top-ranked docking solutions of seeded databases against six target proteins. The scores of the experimental poses were placed within the total set to assess whether the scoring function required an accurate pose to provide the appropriate rank for the seeded compounds. This method allows a direct comparison of library ranking efficacy. Our results indicate that the LigandFit/Ligscore1 and LigandFit/GOLD docking/scoring combinations, and to a lesser degree FlexX/FlexX, Glide/Ligscore1, DOCK/PMF (Tripos implementation), LigandFit1/Ligscore2 and LigandFit/PMF (Tripos implementation) were able to retrieve the highest number of actives at a 10\% fraction of the database when all targets were looked upon collectively. We also show that the scoring functions rank the observed binding modes higher than the inaccurate poses provided that the experimental poses are available. This finding stresses the discriminatory ability of the scoring algorithms, when better poses are available, and suggests that the number of false positives can be lowered with conformers closer to bioactive ones.",
}

@Article{Perola04,
  author = "E. Perola and W.P. Walters and P.S.
Charifson",
  title = "A detailed comparison of current docking and scoring methods on systems of pharmaceutical relevance",
  journal = "Proteins",
  volume = "56",
  number = "2",
  year = "2004",
  pages = "235-249",
  abstract = "A thorough evaluation of some of the most advanced docking and scoring methods currently available is described, and guidelines for the choice of an appropriate protocol for docking and virtual screening are defined. The generation of a large and highly curated test set of pharmaceutically relevant protein-ligand complexes with known binding affinities is described, and three highly regarded docking programs (Glide, GOLD, and ICM) are evaluated on the same set with respect to their ability to reproduce crystallographic binding orientations. Glide correctly identified the crystallographic pose within 2.0 {\AA} in 61\% of the cases, versus 48\% for GOLD and 45\% for ICM. In general Glide appears to perform most consistently with respect to diversity of binding sites and ligand flexibility, while the performance of ICM and GOLD is more binding site-dependent and it is significantly poorer when binding is predominantly driven by hydrophobic interactions. The results also show that energy minimization and reranking of the top N poses can be an effective means to overcome some of the limitations of a given docking function. The same docking programs are evaluated in conjunction with three different scoring functions for their ability to discriminate actives from inactives in virtual screening. The evaluation, performed on three different systems (HIV-1 protease, IMPDH, and p38 MAP kinase), confirms that the relative performance of different docking and scoring methods is to some extent binding site-dependent.
GlideScore appears to be an effective scoring function for database screening, with consistent performance across several types of binding sites, while ChemScore appears to be most useful in sterically demanding sites since it is more forgiving of repulsive interactions. Energy minimization of docked poses can significantly improve the enrichments in systems with sterically demanding binding sites. Overall Glide appears to be a safe general choice for docking, while the choice of the best scoring tool remains to a larger extent system-dependent and should be evaluated on a case-by-case basis.",
}

@Article{Warren05,
  author = "G.L. Warren and C.W. Andrews and A.M. Capelli and B. Clarke and J. LaLonde and M.H. Lambert and M. Lindvall and N. Nevins and S.F. Semus and S. Senger and G. Tedesco and I.D. Wall and J.M. Woolven and C.E. Peishoff and M.S. Head",
  title = "A critical assessment of docking programs and scoring functions",
  journal = "J. Med. Chem.",
  note = "ASAP Article",
  doi = "10.1021/jm050362n",
  month = aug,
  year = "2005",
  abstract = "Docking is a computational technique that samples conformations of small molecules in protein binding sites; scoring functions are used to assess which of these conformations best complements the protein binding site. An evaluation of 10 docking programs and 37 scoring functions was conducted against eight proteins of seven protein types for three tasks: binding mode prediction, virtual screening for lead identification, and rank-ordering by affinity for lead optimization. All of the docking programs were able to generate ligand conformations similar to crystallographically determined protein/ligand complex structures for at least one of the targets. However, scoring functions were less successful at distinguishing the crystallographic conformation from the set of docked poses.
Docking programs identified active compounds from a pharmaceutically relevant pool of decoy compounds; however, no single program performed well for all of the targets. For prediction of compound affinity, none of the docking programs or scoring functions made a useful prediction of ligand binding affinity.",
}

@Article{Erickson04,
  author = "J.A. Erickson and M. Jalaie and D.H. Robertson and R.A. Lewis and M. Vieth",
  title = "Lessons in Molecular Recognition: The Effects of Ligand and Protein Flexibility on Molecular Docking Accuracy",
  journal = "J. Med. Chem.",
  volume = "47",
  number = "1",
  year = "2004",
  pages = "45-55",
  abstract = "The key to success for computational tools used in structure-based drug design is the ability to accurately place or dock a ligand in the binding pocket of the target of interest. In this report we examine the effect of several factors on docking accuracy, including ligand and protein flexibility. To examine ligand flexibility in an unbiased fashion, a test set of 41 ligand-protein cocomplex X-ray structures were assembled that represent a diversity of size, flexibility, and polarity with respect to the ligands. Four docking algorithms, DOCK, FlexX, GOLD, and CDOCKER, were applied to the test set, and the results were examined in terms of the ability to reproduce X-ray ligand positions within 2.0{\AA} heavy atom root-mean-square deviation. Overall, each method performed well (>50\% accuracy) but for all methods it was found that docking accuracy decreased substantially for ligands with eight or more rotatable bonds. Only CDOCKER was able to accurately dock most of those ligands with eight or more rotatable bonds (71\% accuracy rate). A second test set of structures was gathered to examine how protein flexibility influences docking accuracy. CDOCKER was applied to X-ray structures of trypsin, thrombin, and HIV-1-protease, using protein structures bound to several ligands and also the unbound (apo) form.
Docking experiments of each ligand to one average structure and to the apo form were carried out, and the results were compared to docking each ligand back to its originating structure. The results show that docking accuracy falls off dramatically if one uses an average or apo structure. In fact, it is shown that the drop in docking accuracy mirrors the degree to which the protein moves upon ligand binding.",
}

@Unpublished{Zavodszky05,
  author = "M.I. Zavodszky and L. Kuhn",
  title = "Lessons from Docking Validation",
  note = "submitted for publication",
  year = "2005",
  url = "http://www.bch.msu.edu/labs/kuhn/web/publication_papers/pdf/Zavodszky_Kuhn_JMedChem_2005.pdf",
}

@Article{Bursulaya03,
  author = "B.D. Bursulaya and M. Totrov and R. Abagyan and C.L. {Brooks, III}",
  title = "Comparative study of several algorithms for flexible ligand docking",
  journal = "J Comput. Aided Mol. Des",
  volume = "17",
  year = "2003",
  pages = "755-763",
}

@Article{Nissink02,
  author = "J.W.M. Nissink and C. Murray and M. Hartshorn and M.L. Verdonk and J.C. Cole and R. Taylor",
  title = "A new test set for validating predictions of protein-ligand interaction",
  journal = "Proteins",
  volume = "49",
  number = "4",
  year = "2002",
  pages = "457-471",
}

@Article{Bissantz00,
  author = "C. Bissantz and G. Folkers and D. Rognan",
  title = "Protein-based virtual screening of chemical databases. 1. Evaluation of different docking/scoring combinations",
  journal = "J. Med. Chem.",
  volume = "43",
  year = "2000",
  pages = "4759-4767",
  abstract = "Three different database docking programs (Dock, FlexX, Gold) have been used in combination with seven scoring functions (Chemscore, Dock, FlexX, Fresno, Gold, Pmf, Score) to assess the accuracy of virtual screening methods against two protein targets (thymidine kinase, estrogen receptor) of known three-dimensional structure. For both targets, it was generally possible to discriminate about 7 out of 10 true hits from a random database of 990 ligands.
The use of consensus lists common to two or three scoring functions clearly enhances hit rates among the top 5\% scorers from 10\% (single scoring) to 25-40\% (double scoring) and up to 65-70\% (triple scoring). However, in all tested cases, no clear relationships could be found between docking and ranking accuracies. Moreover, predicting the absolute binding free energy of true hits was not possible whatever docking accuracy was achieved and scoring function used. As the best docking/consensus scoring combination varies with the selected target and the physicochemistry of target-ligand interactions, we propose a two-step protocol for screening large databases: (i) screening of a reduced dataset containing a few known ligands for deriving the optimal docking/consensus scoring scheme, (ii) applying the latter parameters to the screening of the entire database.",
}

@Article{Perez01,
  author = "C. Perez and A.R. Ortiz",
  title = "Evaluation of docking functions for protein-ligand docking",
  journal = "J. Med. Chem.",
  volume = "44",
  year = "2001",
  pages = "3768-3785",
}

@Article{Vieth98a,
  author = "M. Vieth and J. Hirst and B.N. Dominy and H. Daigler and C.L. {Brooks, III}",
  title = "Assessing search strategies for flexible docking",
  journal = "J. Comput. Chem.",
  volume = "19",
  year = "1998",
  pages = "1623-1631",
}

@Article{Ha00,
  author = "S. Ha and R. Andreani and A. Robbins and I. Muegge",
  title = "Evaluation of docking/scoring approaches: A comparative study based on {MMP3} inhibitors",
  journal = "Journal of Computer-Aided Molecular Design",
  volume = "14",
  number = "5",
  year = "2000",
  pages = "435-448",
  abstract = "An increasing number of docking/scoring programs are available that use different sampling and scoring algorithms. A reliable scoring function is the crucial element of such approaches. Comparative studies are needed to evaluate their current capabilities.
DOCK4 with force field and PMF scoring as well as FlexX were used to evaluate the predictive power of these docking/scoring approaches to identify the correct binding mode of 61 MMP-3 inhibitors in a crystal structure of stromelysin and also to rank them according to their different binding affinities. It was found that DOCK4/PMF scoring performs significantly better than FlexX and DOCK4/FF in both ranking ligands and predicting their binding modes. Most notably, DOCK4/PMF was the only scoring/docking approach that found a significant correlation between binding affinity and predicted score of the docked inhibitors. However, comparing only those cases where the correct binding mode was identified (scoring highest among sampled poses), FlexX showed the best `fine tuning' (lowest rmsd) in predicted binding modes. The results suggest that not so much the sampling procedure but rather the scoring function is the crucial element of a docking program.",
}

@Article{Schulz-Gasch03,
  author = "T. Schulz-Gasch and M. Stahl",
  title = "Binding site characteristics in structure-based virtual screening: evaluation of current docking tools",
  journal = "Journal of Molecular Modeling",
  volume = "9",
  number = "1",
  year = "2003",
  pages = "47-57",
  abstract = "Two new docking programs FRED (OpenEye Scientific Software) and Glide (Schr{\"o}dinger, Inc.) in combination with various scoring functions implemented in these programs have been evaluated against a variety of seven protein targets (cyclooxygenase-2, estrogen receptor, p38 MAP kinase, gyrase B, thrombin, gelatinase A, neuraminidase) in order to assess their accuracy in virtual screening. Sets of known inhibitors were added to and ranked relative to a random library of drug-like compounds. Performance was compared in terms of enrichment factors and CPU time consumption. Results and specific features of the two new tools are discussed and compared to previously published results using FlexX (Tripos, Inc.) as a docking engine.
In addition, general criteria for the selection of docking algorithms and scoring functions based on binding-site characteristics of specific protein targets are proposed.",
}

@Article{Merlitz02,
  author = "H. Merlitz and W. Wenzel",
  title = "Comparison of stochastic optimization methods for receptor-ligand docking",
  journal = "Chemical Physics Letters",
  volume = "362",
  number = "3",
  year = "2002",
  pages = "271-277",
  abstract = "We compare the efficiency of three stochastic optimization methods, simulated annealing, parallel tempering and stochastic tunneling to locate the global minima of complex and rugged potential energy surfaces arising from atomistic models for receptor-ligand docking. The stochastic tunneling method proves to be the most efficient generic approach for atomistic receptor-ligand docking in the rigid ligand - rigid receptor approximation.",
}

@Article{McConkey02,
  author = "B. McConkey and V. Sobolev and M. Edelman",
  title = "The performance of current methods in ligand-protein docking",
  journal = "Current Science",
  volume = "83",
  number = "7",
  year = "2002",
  pages = "845-856",
  abstract = "Computer-based methods for predicting the structure of ligand-protein complexes or docking algorithms have application in both drug design and the elucidation of biochemical pathways. The number of solved structures of ligand-protein complexes now permits the testing and validation of docking algorithms, by comparison of predicted complexes with structures extracted from protein databases. This paper outlines the methodologies and compares their performance in predicting the structure of ligand-protein complexes.",
}

@Article{Cummings05,
  author = "M.D. Cummings and R.L. DesJarlais and A.C. Gibbs and V. Mohan and E.P. Jaeger",
  title = "Comparison of Automated Docking Programs as Virtual Screening Tools",
  journal = "J. Med.
Chem.",
  year = "2005",
  volume = "48",
  pages = "962-976",
  comment = "Related to data set provided by Joe Corkery",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand scoring overviews
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Gohlke02,
  author = "H. Gohlke and G. Klebe",
  title = "Approaches to the description and prediction of the binding affinity of small-molecule ligands to macromolecular receptors",
  journal = "Angew. Chem., Int. Ed.",
  volume = "41",
  year = "2002",
  pages = "2644-2676",
}

@InCollection{Buhm02,
  author = "H.J. B{\"o}hm and M. Stahl",
  title = "The use of scoring functions in drug discovery applications",
  booktitle = "Reviews in Computational Chemistry",
  publisher = "Wiley-VCH",
  location = "New York",
  volume = "18",
  year = "2002",
  pages = "41-87",
}

@Article{Tame05,
  author = "J. Tame",
  title = "Scoring Functions -- the First 100 Years",
  journal = "Journal of Computer-Aided Molecular Design",
  volume = "19",
  number = "6",
  month = jun,
  year = "2005",
  pages = "445-451",
  abstract = "The use of simple linear mathematical models to estimate chemical properties is not a new idea. Albert Einstein used very simple `gravity-like' forces to explain the capillarity of different liquids in 1900-1901. Today such models are used in more complicated situations, and a great many have been developed to analyse interactions between proteins and their ligands. This is not surprising, since proteins are too complicated to model accurately without lengthy numerical analysis, and simple models often do at least as good a job in predicting binding constants as much more computationally expensive methods. One hundred years after Einstein's `miraculous year' in which he transformed physics, it is instructive to recall some of his even earlier work. As approximations, `scoring functions' are excellent, but it is dangerous to read too much into them.
A few cautionary tales are presented for the beginner to the field of ligand affinity prediction by linear models.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand scoring force field methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Brooks83,
  author   = "Bernard R. Brooks and Robert E. Bruccoleri and Barry D. Olafson and David J. States and S. Swaminathan and Martin Karplus",
  title    = "{CHARMM:} A program for macromolecular energy, minimization, and dynamics calculations",
  journal  = "J. Comput. Chem.",
  volume   = "4",
  number   = "2",
  pages    = "187-217",
  year     = "1983",
  comment  = "This is the main reference for CHARMM.",
}

@Article{Cornell95,
  author   = "W.D. Cornell and P. Cieplak and C.I. Bayly and I.R. Gould and K.M. {Merz, Jr.} and D.M. Ferguson and D.C. Spellmeyer and T. Fox and J.W. Caldwell and P.A. Kollman",
  title    = "A Second Generation Force Field for the Simulation of Proteins, Nucleic Acids, and Organic Molecules",
  journal  = "Journal of the American Chemical Society",
  volume   = "117",
  number   = "19",
  year     = "1995",
  pages    = "5179-5197",
  comment  = "This is the main reference for AMBER(?)",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand scoring with empirical methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Eldridge97,
  author   = "M.D. Eldridge and C.W. Murray and T.R. Auton and G.V. Paolini and R.P. Mee",
  title    = "Empirical scoring functions. {I:} The development of a fast empirical scoring function to estimate the binding affinity of ligands in receptor complexes",
  journal  = "J. Comput.-Aided Mol. Des.",
  volume   = "11",
  year     = "1997",
  pages    = "425-445",
  comment  = "This is the main reference for ChemScore.",
}

@Article{Boehm94,
  author   = "H.J.
Boehm",
  title    = "The development of a simple empirical scoring function to estimate the binding constant for a protein-ligand complex of known three-dimensional structure",
  journal  = "J. Comput.-Aided Mol. Des.",
  volume   = "8",
  year     = "1994",
  pages    = "243-256",
}

% The citation key is kept as "Buhm98" so existing \cite commands still resolve;
% the author is spelled "Boehm", as in the Boehm94 entry for the same person.
@Article{Buhm98,
  author   = "H.J. Boehm",
  title    = "Prediction of binding constants of protein ligands: A fast method for the prioritization of hits obtained from de novo design or 3d database search programs",
  journal  = "J. Comput.-Aided Mol. Des.",
  volume   = "12",
  year     = "1998",
  pages    = "309-323",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand scoring with knowledge-based methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Gohlke00,
  author   = "H. Gohlke and M. Hendlich and G. Klebe",
  title    = "Knowledge-based scoring function to predict protein-ligand interactions",
  journal  = "J. Mol. Biol.",
  volume   = "295",
  year     = "2000",
  pages    = "337-356",
  comment  = "This is the main reference for DrugScore, a knowledge-based scoring method.",
}

@Article{Mitchell99a,
  author   = "J.B.O. Mitchell and R. Laskowski and A. Alex and J.M. Thornton",
  title    = "{BLEEP} - potential of mean force describing protein-ligand interactions: I. Generating potential",
  journal  = "J. Comput. Chem.",
  volume   = "20",
  number   = "11",
  year     = "1999",
  pages    = "1165-1176",
  comment  = "This is the main reference for BLEEP.",
  abstract = "We have developed BLEEP (biomolecular ligand energy evaluation protocol), an atomic level potential of mean force (PMF) describing protein-ligand interactions. The pair potentials for BLEEP have been derived from high-resolution X-ray structures of protein-ligand complexes in the Brookhaven Protein Data Bank (PDB), with a careful treatment of homology.
The use of a broad variety of protein-ligand structures in the derivation phase gives BLEEP more general applicability than previous potentials, which have been based on limited classes of complexes, and thus represents a significant step forward. We calculate the distance distributions in protein-ligand interactions for all 820 possible pairs that can be chosen from our set of 40 different atom types, including polar hydrogen. We then use a reverse Boltzmann methodology to convert these into energy-like pair potential functions. Two versions of BLEEP are calculated, one including and one excluding interactions between protein and water. The pair potentials are found to have the expected forms; polar and hydrogen bonding interactions show minima at short range, around 3.0 {\AA}, whereas a typical hydrophobic interaction is repulsive at this distance, with values above 4.0 {\AA} being preferred.",
}

@Article{Mitchell99b,
  author   = "J.B.O. Mitchell and R. Laskowski and A. Alex and J.M. Thornton",
  title    = "{BLEEP} - potential of mean force describing protein-ligand interactions: II. Calculation of binding energies and comparison with experimental data",
  journal  = "J. Comput. Chem.",
  volume   = "20",
  number   = "11",
  year     = "1999",
  pages    = "1177-1185",
}

@Article{Nobeli01,
  author   = "I. Nobeli and J.B.O. Mitchell and A. Alex and J.M. Thornton",
  title    = "Evaluation of a Knowledge-Based Potential of Mean Force for Scoring Docked Protein-Ligand Complexes",
  journal  = "Journal of Computational Chemistry",
  volume   = "22",
  number   = "7",
  year     = "2001",
  pages    = "673-688",
}

@Article{Muegge99,
  author   = "I. Muegge and Y.C. Martin",
  title    = "A general and fast scoring function for protein-ligand interactions: A simplified potential approach",
  journal  = "J. Med. Chem.",
  volume   = "42",
  year     = "1999",
  pages    = "791-804",
}

@Article{Sippl95,
  author   = "M.J. Sippl",
  title    = "Knowledge-based potentials for proteins",
  journal  = "Curr. Opin. Struct.
Biol.",
  volume   = "5",
  year     = "1995",
  pages    = "229-235",
}

@Article{Tanaka76,
  author   = "S. Tanaka and H.A. Scheraga",
  title    = "Medium- and long-range interaction parameters between amino acids for predicting three-dimensional structures of proteins",
  journal  = "Macromolecules",
  volume   = "9",
  year     = "1976",
  pages    = "945-950",
  comment  = "Early paper on data-driven scoring",
  abstract = "In a previous paper, a hypothesis for protein folding was proposed in which the native structure is formed by a three-step mechanism: (A) formation of ordered backbone structures by short-range interactions, (B) formation of small contact regions by medium-range interactions, and (C) association of the small contact regions into the native structure by long-range interactions. In this paper the empirical interaction parameters, used as a measure of the medium- and long-range interactions (the standard free energy, $\Delta G^{\circ}_{k,l}$, of formation of a contact between amino acids of species k and l) that include the role of the solvent (water) and determine the conformation of a protein in steps B and C, are evaluated from the frequency of contacts in the x-ray structures of native proteins. The numerical values of $\Delta G^{\circ}_{k,l}$ for all possible pairs of the 20 naturally occurring amino acids are presented. Contacts between highly nonpolar side chains of amino acids such as Ile, Phe, Trp, and Leu are shown quantitatively to be stable. On the contrary, contacts involving polar side chains of amino acids such as Ser, Asp, Lys, and Glu are significantly less stable. While this implies, in a quantitative manner, that it is generally more favorable for nonpolar groups to lie in the interior of the protein molecule and for the polar side chains to be exposed to the solvent (water) rather than to form contacts with other amino acids, many exceptions to this generalization are observed.",
}

@Article{Ge05,
  author   = "W. Ge and B. Schneider and W.K.
Olson",
  title    = "Knowledge-Based Elastic Potentials for Docking Drugs or Proteins with Nucleic Acids",
  journal  = "Biophysical Journal",
  volume   = "88",
  year     = "2005",
  pages    = "1166-1190",
  abstract = "Elastic ellipsoidal functions defined by the observed hydration patterns around the DNA bases provide a new basis for measuring the recognition of ligands in the grooves of double-helical structures. Here a set of knowledge-based potentials suitable for quantitative description of such behavior is extracted from the observed positions of water molecules and amino acid atoms that form hydrogen bonds with the nitrogenous bases in high resolution crystal structures. Energies based on the displacement of hydrogen-bonding sites on drugs in DNA-crystal complexes relative to the preferred locations of water binding around the heterocyclic bases are low, pointing to the reliability of the potentials and the apparent displacement of water molecules by drug atoms in these structures. The validity of the energy functions has been further examined in a series of sequence substitution studies based on the structures of DNA bound to polyamides that have been designed to recognize the minor-groove edges of Watson-Crick basepairs. The higher energies of binding to incorrect sequences superimposed (without conformational adjustment or displacement of polyamide ligands) on observed high resolution structures confirm the hypothesis that the drug subunits associate with specific DNA bases. The knowledge-based functions also account satisfactorily for the measured free energies of DNA-polyamide association in solution and the observed sites of polyamide binding on nucleosomal DNA. The computations are generally consistent with mechanisms by which minor-groove binding ligands are thought to recognize DNA basepairs.
The calculations suggest that the asymmetric distributions of hydrogen-bond-forming atoms on the minor-groove edge of the basepairs may underlie ligand discrimination of G$\cdot$C from C$\cdot$G pairs, in addition to the commonly believed role of steric hindrance. The analysis of polyamide-bound nucleosomal structures reveals other discrepancies in the expected chemical design, including unexpected contacts to DNA and modified basepair targets of some ligands. The ellipsoidal potentials thus appear promising as a mathematical tool for the study of drug- and protein-DNA interactions and for gaining new insights into DNA-binding mechanisms.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand scoring by consensus
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Charifson99,
  author   = "P.S. Charifson and J.J. Corkery and M.A. Murcko and W.P. Walters",
  title    = "Consensus scoring: A method for obtaining improved hit rates from docking databases of three-dimensional structures into proteins",
  journal  = "J. Med. Chem.",
  volume   = "42",
  year     = "1999",
  pages    = "5100-5109",
}

@Article{Clark02,
  author   = "R.D. Clark and A. Strizhev and J.M. Leonard and J.F. Blake and J.B. Matthew",
  title    = "Consensus scoring for ligand/protein interactions",
  journal  = "Journal of Molecular Graphics and Modelling",
  volume   = "20",
  number   = "4",
  year     = "2002",
  pages    = "281-295",
}

@Article{Paul02,
  author   = "N. Paul and D. Rognan",
  title    = "ConsDock: A new program for the consensus analysis of protein-ligand interactions",
  journal  = "Proteins",
  volume   = "47",
  year     = "2002",
  pages    = "521-533",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-ligand scoring evaluations
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Wang04,
  author   = "R. Wang and Y. Lu and X. Fang and S.
Wang",
  title    = "An Extensive Test of 14 Scoring Functions Using {PDBbind} Refined Set of 800 Protein-Ligand Complexes",
  journal  = "J. Chem Inf Comput Sci",
  volume   = "44",
  year     = "2004",
  pages    = "2114-2125",
  abstract = "Fourteen popular scoring functions, i.e., X-Score, DrugScore, five scoring functions in the Sybyl software (D-Score, PMF-Score, G-Score, ChemScore, and F-Score), four scoring functions in the Cerius2 software (LigScore, PLP, PMF, and LUDI), two scoring functions in the GOLD program (GoldScore and ChemScore), and HINT, were tested on the refined set of the PDBbind database, a set of 800 diverse protein-ligand complexes with high-resolution crystal structures and experimentally determined Ki or Kd values. The focus of our study was to assess the ability of these scoring functions to predict binding affinities based on the experimentally determined high-resolution crystal structures of proteins in complex with their ligands. The quantitative correlation between the binding scores produced by each scoring function and the known binding constants of the 800 complexes was computed. X-Score, DrugScore, Sybyl::ChemScore, and Cerius2::PLP provided better correlations than the other scoring functions with standard deviations of 1.8-2.0 log units. These four scoring functions were also found to be robust enough to carry out computation directly on unaltered crystal structures. To examine how well scoring functions predict the binding affinities for ligands bound to the same target protein, the performance of these 14 scoring functions were evaluated on three subsets of protein-ligand complexes from the test set: HIV-1 protease complexes (82 entries), trypsin complexes (45 entries), and carbonic anhydrase II complexes (40 entries).
Although the results for the HIV-1 protease subset are less than desirable, several scoring functions are able to satisfactorily predict the binding affinities for the trypsin and the carbonic anhydrase II subsets with standard deviation as low as 1.0 log unit (corresponding to 1.3-1.4 kcal/mol at room temperature). Our results demonstrate the strengths as well as the weaknesses of current scoring functions for binding affinity prediction.",
}

@Article{Marsden04,
  author   = "P.M. Marsden and D. Puvanendrampillai and J.B.O. Mitchell and R.C. Glen",
  title    = "Predicting protein ligand binding affinities: a low scoring game?",
  journal  = "Organic \& Biomolecular Chemistry",
  volume   = "2",
  year     = "2004",
  pages    = "3267-3273",
  comment  = "Compares binding affinities predicted by several scoring functions to measured values and finds poor correlations.",
}

@Article{Ferrara04,
  author   = "P. Ferrara and H. Gohlke and D.J. Price and G. Klebe and C.L. {Brooks, III}",
  title    = "Assessing Scoring Functions for Protein-Ligand Interactions",
  journal  = "J. Med. Chem.",
  volume   = "47",
  year     = "2004",
  pages    = "3032-3047",
}

@Article{Xing04,
  author   = "L. Xing and E. Hodgkin and Q. Liu and D. Sedlock",
  title    = "Evaluation and application of multiple scoring functions for a virtual screening experiment",
  journal  = "J. Comput.-Aided Mol. Des.",
  volume   = "18",
  year     = "2004",
  pages    = "333-344",
}

@Article{Wang03,
  author   = "R. Wang and Y. Lu and S. Wang",
  title    = "Comparative evaluation of 11 scoring functions for molecular docking",
  journal  = "J. Med. Chem.",
  volume   = "46",
  year     = "2003",
  pages    = "2287-2303",
}

@Article{Wei02,
  author   = "B.Q. Wei and W.A. Baase and L.H. Weaver and B.W. Matthews and B.K. Shoichet",
  title    = "A model binding site for testing scoring functions in molecular docking",
  journal  = "J. Mol. Biol.",
  volume   = "322",
  year     = "2002",
  pages    = "339-355",
}

@Article{Stahl01,
  author   = "M. Stahl and M.
Rarey",
  title    = "Detailed analysis of scoring functions for virtual screening",
  journal  = "J. Med. Chem.",
  volume   = "44",
  year     = "2001",
  pages    = "1035-1042",
}

@Article{Vieth98b,
  author   = "M. Vieth and J. Hirst and A. Kolinski and C.L. {Brooks, III}",
  title    = "Assessing energy functions for flexible docking",
  journal  = "J. Comput. Chem.",
  volume   = "19",
  year     = "1998",
  pages    = "1612-1622",
}

@Article{Sotriffer02b,
  author   = "C.A. Sotriffer and H. Gohlke and G. Klebe",
  title    = "Docking into knowledge-based potential fields: A comparative evaluation of {DrugScore}",
  journal  = "J. Med. Chem.",
  volume   = "45",
  year     = "2002",
  pages    = "1967-1970",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-protein binding site analysis
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Chakrabarti02,
  author   = "P. Chakrabarti and J. Janin",
  title    = "Dissecting protein-protein recognition sites",
  journal  = "Proteins: Structure, Function, and Genetics",
  volume   = "47",
  number   = "3",
  year     = "2002",
  pages    = "334-343",
  abstract = "The recognition sites in 70 pairwise protein-protein complexes of known three-dimensional structure are dissected in a set of surface patches by clustering atoms at the interface. When the interface buries <2000 Angstroms^2 of protein surface, the recognition sites usually form a single patch on the surface of each component protein. In contrast, larger interfaces are generally multipatch, with at least one pair of patches that are equivalent in size to a single-patch interface. Each recognition site, or patch within a site, contains a core made of buried interface atoms, surrounded by a rim of atoms that remain accessible to solvent in the complex. A simple geometric model reproduces the number and distribution of atoms within a patch.
The rim is similar in composition to the rest of the protein surface, but the core has a distinctive amino acid composition, which may help in identifying potential protein recognition sites on single proteins of known structures.",
}

@Article{Jones00,
  author   = "S. Jones and A. Marin and J.M. Thornton",
  title    = "Protein domain interfaces: characterization and comparison with oligomeric protein interfaces",
  journal  = "Protein Engineering",
  volume   = "13",
  number   = "2",
  pages    = "77-82",
  year     = "2000",
  abstract = "The physical and chemical properties of domain-domain interactions have been analysed in two-domain proteins selected from the protein classification, CATH. The two-domain structures were divided into those derived from (i) monomeric proteins, or (ii) oligomeric or complexed proteins. The size, polarity, hydrogen bonding and packing of the intra-chain domain interface were calculated for both sets of two-domain structures. The results were compared with inter-chain interface parameters from permanent and non-obligate protein-protein complexes. In general, the intra-chain domain and inter-chain interfaces were remarkably similar. Many of the intra-chain interface properties are intermediate between those calculated for permanent and non-obligate inter-chain complexes. Residue interface propensities were also found to be very similar, with hydrophobic residues playing a major role, together with positively charged arginine residues. In addition, the residue composition of the domain interfaces were found to be more comparable with domain surfaces than domain cores. The implications of these results for domain swapping and protein folding are discussed.",
}

@Article{Bogan98,
  author   = "A.A. Bogan and K.S. Thorn",
  title    = "Anatomy of hot spots in protein interfaces",
  journal  = "J. Mol. Biol.",
  volume   = "280",
  year     = "1998",
  pages    = "1-9",
}

@Article{DeLano02,
  author   = "W.L.
DeLano",
  title    = "Unraveling hot spots in binding interfaces: Progress and challenges",
  journal  = "Curr. Opin. Struct. Biol.",
  volume   = "12",
  year     = "2002",
  pages    = "14-20",
}

@Article{Hu00,
  author   = "Z. Hu and B. Ma and H. Wolfson and R. Nussinov",
  title    = "Conservation of polar residues as hot spots at protein-protein interfaces",
  journal  = "Proteins",
  volume   = "39",
  year     = "2000",
  pages    = "331-342",
}

@Article{Jones97,
  author   = "S. Jones and J.M. Thornton",
  title    = "Analysis of protein-protein interaction sites using surface patches",
  journal  = "Journal of Molecular Biology",
  volume   = "272",
  number   = "1",
  month    = "September",
  year     = "1997",
  pages    = "121-132",
}

@Article{Jones96,
  author   = "S. Jones and J.M. Thornton",
  title    = "Principles of protein-protein interactions",
  journal  = "PNAS",
  volume   = "93",
  number   = "1",
  year     = "1996",
  pages    = "13-20",
  abstract = "This review examines protein complexes in the Brookhaven Protein Databank to gain a better understanding of the principles governing the interactions involved in protein-protein recognition. The factors that influence the formation of protein-protein complexes are explored in four different types of protein-protein complexes---homodimeric proteins, heterodimeric proteins, enzyme-inhibitor complexes, and antibody-protein complexes. The comparison between the complexes highlights differences that reflect their biological roles.",
}

% NOTE(review): J Mol Biol volume 285 appeared in 1999; the citation key is kept
% as "LoConte98" so existing \cite commands still resolve.
@Article{LoConte98,
  author   = "L. {Lo Conte} and C. Chothia and J. Janin",
  title    = "The atomic structure of protein-protein recognition sites",
  journal  = "J Mol Biol",
  volume   = "285",
  year     = "1999",
  pages    = "2177-2198",
}

@Article{Norel99,
  author   = "R. Norel and D. Petrey and H.J. Wolfson and R. Nussinov",
  title    = "Examination of shape complementarity in docking of unbound proteins",
  journal  = "Proteins",
  volume   = "36",
  year     = "1999",
  pages    = "307-317",
}

@Article{Larsen98,
  author   = "T.A. Larsen and A.J. Olson and D.S.
Goodsell",
  title    = "Morphology of protein-protein interfaces",
  journal  = "Structure",
  volume   = "6",
  number   = "4",
  year     = "1998",
  pages    = "421-427",
  abstract = "BACKGROUND: Most soluble proteins are active as low-number oligomers. Statistical surveys of oligomeric proteins have defined the roles of hydrophobicity and complementarity in the stability of protein interfaces, but tend to average structural features over a diverse set of protein-protein interfaces, blurring information on how individual interfaces are stabilized. RESULTS: We report a visual survey of 136 homodimeric proteins from the Brookhaven Protein Data Bank, with images that highlight the major structural features of each protein-protein interaction surface. Nearly all of these proteins have interfaces formed between two globular subunits. Surprisingly, the pattern of hydrophilicity over the surface of these interfaces is quite variable. Approximately one-third of the interfaces show a recognizable hydrophobic core, with a single large, contiguous, hydrophobic patch surrounded by a ring of intersubunit polar interactions. The remaining two-thirds of the proteins show a varied mixture of small hydrophobic patches, polar interactions and water molecules scattered over the entire interfacial area. Ten proteins in the survey have intertwined interfaces formed by extensive interdigitation of the two subunit chains. These interfaces are very hydrophobic and are associated with proteins that require both stability and internal symmetry. CONCLUSIONS: The archetypal protein interface, with a defined hydrophobic core, is present in only a minority of the surveyed homodimeric proteins. Most homodimeric proteins are stabilized by a combination of small hydrophobic patches, polar interactions and a considerable number of bridging water molecules.
The presence or absence of a hydrophobic core within these interfaces does not correlate with specific protein functions.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-protein binding site prediction
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Neuvirth04,
  author   = "H. Neuvirth and R. Raz and G. Schreiber",
  title    = "{ProMate:} A structure based prediction program to identify the location of protein-protein binding sites",
  journal  = "J Mol Biol",
  volume   = "338",
  year     = "2004",
  pages    = "181-199",
}

@Article{Espadaler05,
  author   = "J. Espadaler and O. {Romero-Isart} and R.M. Jackson and B. Oliva",
  title    = "Prediction of protein-protein interactions using distant conservation of sequence patterns and structure relationships",
  journal  = "Bioinformatics",
  volume   = "21",
  year     = "2005",
  pages    = "3360-3368",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-protein docking overviews
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Szilagyi05,
  author   = "A. Szilagyi and V. Grimm and A.K. Arakaki and J. Skolnick",
  title    = "Prediction of physical protein-protein interactions",
  journal  = "Phys. Biol.",
  volume   = "2",
  year     = "2005",
  pages    = "S1-S16",
  abstract = "Many essential cellular processes such as signal transduction, transport, cellular motion and most regulatory mechanisms are mediated by protein-protein interactions. In recent years, new experimental techniques have been developed to discover the protein-protein interaction networks of several organisms. However, the accuracy and coverage of these techniques have proven to be limited, and computational approaches remain essential both to assist in the design and validation of experimental studies and for the prediction of interaction partners and detailed structures of protein complexes.
Here, we provide a critical overview of existing structure-independent and structure-based computational methods. Although these techniques have significantly advanced in the past few years, we find that most of them are still in their infancy. We also provide an overview of experimental techniques for the detection of protein-protein interactions. Although the developments are promising, false positive and false negative results are common, and reliable detection is possible only by taking a consensus of different experimental approaches. The shortcomings of experimental techniques affect both the further development and the fair evaluation of computational prediction methods. For an adequate comparative evaluation of prediction and high-throughput experimental methods, an appropriately large benchmark set of biophysically characterized protein complexes would be needed, but is sorely lacking.",
}

@Article{Salwinski03,
  author   = "L. Salwinski and D. Eisenberg",
  title    = "Computational methods of analysis of protein-protein interactions",
  journal  = "Curr Opin Struct Biol",
  volume   = "13",
  year     = "2003",
  pages    = "377-382",
}

@Article{Valencia02,
  author   = "A. Valencia and F. Pazos",
  title    = "Computational methods for the prediction of protein interactions",
  journal  = "Curr Opin Struct Biol",
  volume   = "12",
  year     = "2002",
  pages    = "368-373",
}

@Article{Smith02,
  author   = "G.R. Smith and M.J.E. Sternberg",
  title    = "Prediction of protein-protein interactions by docking methods",
  journal  = "Current Opinion in Structural Biology",
  volume   = "12",
  year     = "2002",
  pages    = "28-35",
  abstract = "Recently, developments have been made in predicting the structure of docked complexes when the coordinates of the components are known. The process generally consists of a stage during which the components are combined rigidly and then a refinement stage.
Several rapid new algorithms have been introduced in the rigid docking problem and promising refinement techniques have been developed, based on modified molecular mechanics force fields and empirical measures of desolvation, combined with minimisations that switch on the short-range interactions gradually. There has also been progress in developing a benchmark set of targets for docking and a blind trial, similar to the trials of protein structure prediction, has taken place.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-protein docking methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Schueler-Furman05,
  author   = "O. Schueler-Furman and C. Wang and D. Baker",
  title    = "Progress in protein-protein docking: Atomic resolution predictions in the {CAPRI} experiment using {RosettaDock} with an improved treatment of side-chain flexibility",
  journal  = "Proteins: Structure, Function, and Bioinformatics",
  volume   = "60",
  number   = "2",
  year     = "2005",
  pages    = "187-194",
  abstract = "RosettaDock uses real-space Monte Carlo minimization (MCM) on both rigid-body and side-chain degrees of freedom to identify the lowest free energy docked arrangement of 2 protein structures. An improved version of the method that uses gradient-based minimization for off-rotamer side-chain optimization and includes information from unbound structures was used to create predictions for Rounds 4 and 5 of CAPRI. First, large numbers of independent MCM trajectories were carried out and the lowest free energy docked configurations identified. Second, new trajectories were started from these lowest energy structures to thoroughly sample the surrounding conformation space, and the lowest energy configurations were submitted as predictions.
For all cases in which there were no significant backbone conformational changes, a small number of very low-energy configurations were identified in the first, global search and subsequently found to be close to the center of the basin of attraction in the free energy landscape in the second, local search. Following the release of the experimental coordinates, it was found that the centers of these free energy minima were remarkably close to the native structures in not only the rigid-body orientation but also the detailed conformations of the side-chains. Out of 8 targets, the lowest energy models had interface root-mean-square deviations (RMSDs) less than 1.1 {\AA} from the correct structures for 6 targets, and interface RMSDs less than 0.4 Angstroms for 3 targets. The predictions were top submissions to CAPRI for Targets 11, 12, 14, 15, and 19. The close correspondence of the lowest free energy structures found in our searches to the experimental structures suggests that our free energy function is a reasonable representation of the physical chemistry, and that the real space search with full side-chain flexibility to some extent solves the protein-protein docking problem in the absence of significant backbone conformational changes. On the other hand, the approach fails when there are significant backbone conformational changes as the steric complementarity of the 2 proteins cannot be modeled without incorporating backbone flexibility, and this is the major goal of our current work.",
}

@InProceedings{Choi04,
  author    = "V. Choi and N. Goyal",
  title     = "A Combinatorial Shape Matching Algorithm for Rigid Protein Docking",
  booktitle = "The Fifteenth Annual Symposium on Combinatorial Pattern Matching ({CPM} 2004)",
  series    = "Lecture Notes in Computer Science",
  volume    = "3109",
  year      = "2004",
  pages     = "285-296",
}

@Article{Meyer96,
  author   = "M. Meyer and P. Wilson and D. Schomburg",
  title    = "Hydrogen bonding and molecular surface shape complementarity as a basis for protein docking",
  journal  = "J. Mol.
Biol.",
  volume   = "264",
  year     = "1996",
  pages    = "199-210",
}

@Article{Sobolev96,
  author   = "V. Sobolev and R.C. Wade and G. Vriend and M. Edelman",
  title    = "Molecular docking using surface complementarity",
  journal  = "Proteins Struct. Func. Genet",
  volume   = "25",
  year     = "1996",
  pages    = "120-129",
}

@Article{Helmer94,
  author   = "M. Helmer-Citterich and A. Tramontano",
  title    = "Puzzle: a new method for automated protein docking based on surface shape complementarity",
  journal  = "J. Mol. Biol.",
  volume   = "235",
  year     = "1994",
  pages    = "1021-1031",
}

@Article{Norel95,
  author   = "R. Norel and S.L. Lin and H.J. Wolfson and R. Nussinov",
  title    = "Molecular surface complementarity at protein-protein interfaces: the critical role played by surface normals at well placed, sparse, points in docking",
  journal  = "J. Mol. Biol.",
  volume   = "252",
  year     = "1995",
  pages    = "263-273",
}

@Article{Young94,
  author   = "L. Young and R.L. Jernigan and D.G. Covell",
  title    = "A role for surface hydrophobicity in protein-protein recognition",
  journal  = "Protein Sci",
  year     = "1994",
  month    = "May",
  volume   = "3",
  number   = "5",
  pages    = "717-729",
}

@Article{Gabb97,
  author   = "H. Gabb and R. Jackson and M. Sternberg",
  title    = "Modelling protein docking using shape complementarity, electrostatics, and biochemical information",
  journal  = "J. Mol. Biol.",
  volume   = "272",
  year     = "1997",
  pages    = "106-120",
  comment  = "``A protein docking study was performed for two classes of biomolecular complexes: six enzyme/inhibitor and four antibody/antigen. Biomolecular complexes for which crystal structures of both the complexed and uncomplexed proteins are available were used for eight of the ten test systems. Our docking experiments consist of a global search of translational and rotational space followed by refinement of the best predictions. Potential complexes are scored on the basis of shape complementarity and favourable electrostatic interactions using Fourier correlation theory.
Since proteins undergo conformational changes upon binding, the scoring function must be sufficiently soft to dock unbound structures successfully. Some degree of surface overlap is tolerated to account for side-chain flexibility. Similarly for electrostatics, the interaction of the dispersed point charges of one protein with the Coulombic field of the other is measured rather than precise atomic interactions. We tested our docking protocol using the native rather than the complexed forms of the proteins to address the more scientifically interesting problem of predictive docking. In all but one of our test cases, correctly docked geometries (interface Calpha RMS deviation [remainder of this quotation is missing from the file]''",
}

% NOTE(review): everything between a "<" and a later ">" appears to have been
% stripped from this file at this point.  That removed the end of the Gabb97
% comment above, every entry and section header that followed it, and the start
% of the entry whose abstract ends below.  The surviving fragment is kept here,
% outside any entry, so that it is no longer read as part of Gabb97.  It appears
% to come from a paper on enrichment measures in virtual screening -- TODO:
% restore the missing entries from an earlier copy of this file.
%
% Orphaned abstract fragment: 100 000 compounds) containing multiple (11) activity classes. Structure-unaware atom count vectors as descriptors in combination with the Euclidean distance measure are able to achieve enrichment factors over random selection of around 4 (depending on the particular class of active compounds), putting the enrichment factors reported for more sophisticated virtual screening methods in a different light. They are also able to retrieve active compounds with novel scaffolds instead of merely the expected structural analogues. The added value of many currently used virtual screening methods (calculated as enrichment factors) drops down to a factor of between 1 and 2, instead of often reported double-digit figures. The observed effect is much less profound for simple descriptors such as molecular weight and is only present in cases of atypical (larger) ligands. The current state of virtual screening is not as sophisticated as might be expected, which is due to descriptors still not being able to capture structural properties relevant to binding. This fact can partly be explained by highly nonlinear structure-activity relationships, which represent a severe limitation of the similar property principle in the context of bioactivity.

@Article{Lyne02,
  author   = "P.D.
Lyne",
  title    = "Structure-based virtual screening: an overview",
  journal  = "Drug Discov Today",
  volume   = "7",
  number   = "20",
  month    = oct,
  year     = "2002",
  pages    = "1047--1055",
  abstract = "Enormous advances in genomics have resulted in a large increase in the number of potential therapeutic targets that are available for investigation. This growth in potential targets has increased the demand for reliable target validation, as well as technologies that can identify rapidly several quality lead candidates. Virtual screening, and in particular receptor-based virtual screening, has emerged as a reliable, inexpensive method for identifying leads. Although still an evolving method, advances in computational techniques have enabled virtual screening to have a positive impact on the discovery process. Here, the current strengths and weaknesses of the technology are discussed, and emphasis is placed on aspects of the work-flow of a virtual screening campaign, from preparation through to post-screening analysis.",
}

@Article{Abagyan01,
  author   = "R. Abagyan and M. Totrov",
  title    = "High-throughput docking for lead generation",
  journal  = "Curr Opin Chem Biol",
  volume   = "5",
  year     = "2001",
  pages    = "375--382",
  abstract = "Recent improvements in flexible docking technology may lead to a bigger role for computational methods in lead discovery. Although fast and accurate computational prediction of binding affinities for an arbitrary molecule is still beyond the limits of current methods, the docking and screening procedures can select small sets of likely lead candidates from large libraries of either commercially or synthetically available compounds.",
}

@Article{Walters98,
  author  = "W.P. Walters and M.T. Stahl and M.A. Murcko",
  title   = "Virtual screening - an overview",
  journal = "Drug Discov Today",
  volume  = "3",
  year    = "1998",
  pages   = "160--178",
}

@Article{Shirai01,
  author  = "H. Shirai and J. Shi and T.L. Blundell and K.
Mizuguchi",
  title   = "Structural bioinformatics as an approach to genomics-based drug discovery",
  journal = "Global Outsourcing Review",
  volume  = "3",
  year    = "2001",
  pages   = "48--53",
}

% NOTE(review): the stray space inside the Bajorath02 URL was removed; confirm the address is still the intended one.
@Misc{Bajorath02,
  author  = "J. Bajorath",
  title   = "Virtual screening in drug discovery: methods, expectations and reality",
  note    = "www.currentdrugdiscovery.com",
  month   = mar,
  year    = "2002",
  comment = "Provides overview of virtual screening, points to successes",
}

@Article{Barril04,
  author   = "X. Barril and R.E. Hubbard and S.D. Morley",
  title    = "Virtual Screening in Structure-Based Drug Discovery",
  journal  = "Mini Reviews in Medicinal Chemistry",
  volume   = "4",
  number   = "7",
  month    = sep,
  year     = "2004",
  pages    = "779--791",
  abstract = "Recent advances in structure determination and computational methods have encouraged the development of structure-based virtual screening. Here we survey progress in the field and review the most recent methods, validation experiments and real applications, including an in-house example of hit identification for the oncology target Hsp90. These results provide a basis for discussing the current state of structure-based virtual screening and to outline the developments that are expected to have a major impact in the near future.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Ligand-based drug screening methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Paul04,
  author  = "N. Paul and E. Kellenberger and G. Bret and P. Muller and D. Rognan",
  title   = "Recovering the True Targets of Specific Ligands by Virtual Screening of the Protein Data Bank",
  journal = "PROTEINS: Structure, Function, and Bioinformatics",
  volume  = "54",
  year    = "2004",
  pages   = "671--680",
}

@Article{Zauhar03,
  author  = "R.J. Zauhar and G. Moyna and L. Tian and Z. Li and W.J. Welsh",
  title   = "Shape Signatures: A New Approach to Computer-Aided Ligand- and Receptor-Based Drug Design",
  journal = "J. Med.
Chem.", volume = "46", year = "2003", pages = "5674-5690", abstract = "A unifying principle of rational drug design is the use of either shape similarity or complementarity to identify compounds expected to be active against a given target. Shape similarity is the underlying foundation of ligand-based methods, which seek compounds with structure similar to known actives, while shape complementarity is the basis of most receptorbased design, where the goal is to identify compounds complementary in shape to a given receptor. These approaches can be extended to include molecular descriptors in addition to shape, such as lipophilicity or electrostatic potential. Here we introduce a new technique, which we call shape signatures, for describing the shape of ligand molecules and of receptor sites. The method uses a technique akin to ray-tracing to explore the volume enclosed by a ligand molecule, or the volume exterior to the active site of a protein. Probability distributions are derived from the ray-trace, and can be based solely on the geometry of the reflecting ray, or may include joint dependence on properties, such as the molecular electrostatic potential, computed over the surface. Our shape signatures are just these probability distributions, stored as histograms. They converge rapidly with the length of the ray-trace, are independent of molecular orientation, and can be compared quickly using simple metrics. Shape signatures can be used to test for both shape similarity between compounds and for shape complementarity between compounds and receptors and thus can be applied to problems in both ligand- and receptor-based molecular design. We present results for comparisons between small molecules of biological interest and the NCI Database using shape signatures under two different metrics. Our results show that the method can reliably extract compounds of shape (and polarity) similar to the query molecules. 
We also present initial results for a receptor-based strategy using shape signatures, with application to the design of new inhibitors predicted to be active against HIV protease.",
}

@Article{Chen01,
  author   = "Y.Z. Chen and D.G. Zhi",
  title    = "Ligand-Protein Inverse Docking and Its Potential Use in the Computer Search of Protein Targets of a Small Molecule",
  journal  = "PROTEINS: Structure, Function, and Genetics",
  volume   = "43",
  pages    = "217--226",
  year     = "2001",
  abstract = "Ligand-protein docking has been developed and used in facilitating new drug discoveries. In this approach, docking single or multiple small molecules to a receptor site is attempted to find putative ligands. A number of studies have shown that docking algorithms are capable of finding ligands and binding conformations at a receptor site close to experimentally determined structures. These algorithms are expected to be equally applicable to the identification of multiple proteins to which a small molecule can bind or weakly bind. We introduce a ligand-protein inverse-docking approach for finding potential protein targets of a small molecule by the computer-automated docking search of a protein cavity database. This database is developed from protein structures in the Protein Data Bank (PDB). Docking is conducted with a procedure involving multiple-conformer shape-matching alignment of a molecule to a cavity followed by molecular-mechanics torsion optimization and energy minimization on both the molecule and the protein residues at the binding region. Scoring is conducted by the evaluation of molecular-mechanics energy and, when applicable, by the further analysis of binding competitiveness against other ligands that bind to the same receptor site in at least one PDB entry. Testing results on two therapeutic agents, 4H-tamoxifen and vitamin E, showed that 50\% of the computer-identified potential protein targets were implicated or confirmed by experiments.
The application of this approach may facilitate the prediction of unknown and secondary therapeutic target proteins and those related to the side effects and toxicity of a drug or drug candidate.",
}

@Article{Labute05,
  author   = "P. Labute",
  title    = "On the perception of molecules from {3D} atomic coordinates",
  journal  = "J Chem Inf Model",
  volume   = "45",
  number   = "2",
  year     = "2005",
  pages    = "215--221",
  abstract = "A method is presented for perceiving chemical types of atoms in molecules given 3D atomic coordinates and element identities. The method assigns hybridizations, bond orders, and formal charges for structures whether hydrogen atoms are present. The Maximum Weighted Matching algorithm for nonbipartite graphs is used to assign bond orders with weights derived from statistics of a large collection of organic molecules. Results from tests on a collection of functional groups, heterocycles, entries from the Protein Data Bank, and Cambridge Structural Database as well as a comparison to other methods, are presented and discussed.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Structure-based drug design overviews
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Beavers02,
  author   = "M.P. Beavers and X. Chen",
  title    = "Structure-based combinatorial library design: methodologies and applications",
  journal  = "Journal of Molecular Graphics and Modelling",
  volume   = "20",
  year     = "2002",
  pages    = "463--468",
  abstract = "Rational design of small focused libraries that are biased toward specific therapeutic targets is currently at the forefront of combinatorial library design. Various structure-based design strategies can be implemented in focused library design when the 3D structure of the target is available through X-ray or NMR determination.
This review discusses the major methods and programs specifically developed for the purpose of designing combinatorial libraries under the constraint of the binding site of a biological target, with emphasis on their advantages and disadvantages. Examples of the successful application of these methodologies are highlighted, demonstrating their performances within the practical drug discovery process.", } @Article{Veselovsky03, author = "A.V. Veselovsky and A.S. Ivanov", title = "Strategy of Computer-Aided Drug Design", journal = "Current Drug Targets - Infectious Disorders", volume = "3", number = "1", month = "March", year = "2003", pages = "33-40", abstract = "Modern strategies of computer-aided drug design (CADD) are reviewed. The task of CADD in the pipeline of drug discovery is accelerating of finding the new lead compounds and their structure optimization for the following pharmacological tests. The main directions in CADD are based on the availability of the experimentally determined three-dimensional structure of the target macromolecule. If spatial structure is known the methods of structure-based drug design are used. In the opposite case the indirect methods of CADD based on the structures of known ligands (ligand-based drug design) are used. The interrelationship between the main directions of CADD is reviewed. The main CADD approaches of molecule de novo design and database mining are described. They include methods of molecular docking, de novo design, design of pharmacophore and quantity structure-activity relationship models. New ways and perspectives of CADD are discussed.", } @Article{Klebe00, author = "G. Klebe", title = "Recent developments in structure-based drug design", journal = "J Mol Med", volume = "78", year = "2000", pages = "269-281", } @Article{Gane00, author = "P.J. Gane and P.M. 
Dean", title = "Recent advances in structure-based rational drug design", journal = "Curr Opin Struct Biol", volume = "10", year = "2000", pages = "401-404", } @Article{Ooms00, author = "F. Ooms", title = "Molecular Modeling and Computer Aided Drug Design. Examples of their Applications in Medicinal Chemistry", journal = "Current Medicinal Chemistry", volume = "7", year = "2000", pages = "141-158", abstract = "The development of new drugs with potential therapeutic applications is one of the most complex and difficult process in the pharmaceutical industry. Millions of dollars and man-hours are devoted to the discovery of new therapeutical agents. As, the activity of a drug is the result of a multitude of factors such as bioavailability, toxicity and metabolism, rational drug design has been utopias for centuries. Very recently, impressive technological advances in areas such as structural characterization of biomacromolecules, computer sciences and molecular biology have made rational drug design feasible. The aim of this review is to give an outline of studies in the field of medicinal chemistry in which molecular modeling has helped in the discovery process of new drugs. The emphasis will be on lead generation and optimization.", } @Article{Anderson02, author = "S. Anderson and J. Chiplin", title = "Structural genomics: shaping the future of drug design?", journal = "Drug Discov Today", volume = "7", year = "2002", pages = "105-107", } @Article{Marrone97, author = "T.J. Marrone and J.M. Briggs and J.A. McCammon", title = "Structure-based drug design: Computational Advances", journal = "Annu. Rev. Pharmacol. Toxicol.", volume = "37", year = "1997", pages = "71-90", } @Article{Bohacek97, author = "R.S. Bohacek and C. McMartin", title = "Modern computational chemistry and drug discovery: structure generating programs", journal = "Curr. Opin. Chem. 
Biol.",
  volume  = "1",
  year    = "1997",
  pages   = "157--161",
  comment = "``During 1996 and 1997, the first reports were disclosed of active enzyme inhibitors based entirely on novel structures created by de novo methods. De novo methods have also been used to modify and significantly improve the binding affinity of an HIV protease inhibitor. Work continues in the improvement of methods for the de novo design of compounds which fit and chemically complement a binding site. De novo algorithms that generate only synthetically feasible structures have also been reported. In addition, methods are being developed for the automatic computer generation of virtual molecular libraries which can be searched to identify molecules to match a pharmacophore or fit into a binding site.''",
}

@InCollection{Charifson97,
  author    = "P. Charifson and I.D. Kuntz",
  title     = "Recent Successes and Continuing Limitations in Computer-Aided Drug Design",
  booktitle = "Practical Application of Computer-Aided Drug Design",
  publisher = "Marcel Dekker",
  address   = "New York",
  year      = "1997",
  pages     = "1--37",
}

% NOTE(review): author initials of Kuntz92 aligned with "I.D. Kuntz" as spelled in Charifson97; confirm.
@Article{Kuntz92,
  author  = "I.D. Kuntz",
  title   = "Structure-based Strategies for Drug Design and Discovery",
  journal = "Science",
  volume  = "257",
  pages   = "1078--1082",
  year    = "1992",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Structure-based drug design with fragment-based methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% NOTE(review): author surname restored to "Boehm" with umlaut (was "Buhm"); the citation key is kept
% unchanged so existing citations keep resolving. Confirm the spelling against the paper.
@Article{Buhm92,
  author  = "H.J. B{\"o}hm",
  title   = "The Computer Program {Ludi}: A New Method for the De Novo Design of Enzyme Inhibitors",
  journal = "J. Comp. Aided Molec. Design",
  volume  = "6",
  year    = "1992",
  pages   = "61--78",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Structure-based drug design with knowledge-based methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Grzybowski02,
  author  = "B.A. Grzybowski and A.V. Ishchenko and J.
Shimada and E.I. Shakhnovich",
  title    = "From Knowledge-Based Potentials to Combinatorial Lead Design in Silico",
  journal  = "Acc. Chem. Res.",
  volume   = "35",
  year     = "2002",
  pages    = "261--262",
  abstract = "Computational methods are becoming increasingly used in the drug discovery process. In this Account, we review a novel computational method for lead discovery. This method, called CombiSMoG for `combinatorial small molecule growth', is based on two components: a fast and accurate knowledge-based scoring function used to predict binding affinities of protein-ligand complexes, and a Monte Carlo combinatorial growth algorithm that generates large numbers of low-free-energy ligands in the binding site of a protein. We illustrate the advantages of the method by describing its application in the design of picomolar inhibitors for human carbonic anhydrase.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Structure-based drug design with ...
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Eisen94,
  author  = "M.B. Eisen and D.C. Wiley and M. Karplus and R.E. Hubbard",
  title   = "{HOOK}: A Program for finding novel molecular architectures that satisfy the chemical and steric requirements of a macromolecule binding site",
  journal = "Proteins",
  volume  = "19",
  year    = "1994",
  pages   = "199--221",
}

@Article{vonItzstein93,
  author  = "Mark {von Itzstein} and Wen-Yang Wu and Gaik B. Kok and Michael S. Pegg and Jeffrey C. Dyason and Betty Jin and Tho Van Phan and Mark L. Smythe and Hume F. White and Stuart W. Oliver and Peter M. Colman and Joseph N. Varghese and D. Michael Ryan and Jacqueline M. Woods and Richard C. Bethell and Vanessa J. Hotham and Janet M. Cameron and Charles R.
Penn", title = "Rational design of potent sialidase-based inhibitors of influenza virus replication", journal = "Nature", volume = "363", pages = "418-423", month = "June", year = "1993", comment = "Uses GRID for drug design", } %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% % Quantitative structure activity relationship (QSAR) overviews %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% @Article{Winkler01, author = "D.A. Winkler", title = "The role of quantitative structure-activity relationships (QSAR) in biomolecular discovery", journal = "Briefings in Bioinformatics", volume = "3", number = "1", year = "2002", pages = "73-86", abstract = "Empirical methods for building predictive models of the relationships between molecular structure and useful properties are becoming increasingly important. This has arisen because drug discovery and development have become more complex. A large amount of biological target information is becoming available through molecular biology. Automation of chemical synthesis and pharmacological screening has also provided a vast amount of experimental data. Tools for designing libraries and extracting information from molecular databases and high-throughput screening experiments robustly and quickly enable leads to be discovered more effectively. As drug leads progress down the development pipeline, the ability to predict physicochemical, pharmacokinetic and toxicological properties of these leads is becoming increasingly important in reducing the number of expensive, late development failures. Quantitative structure-activity relationship (QSAR) methods have much to offer in these areas. However, QSAR analysis has many traps for unwary practitioners. 
This review introduces the concepts behind QSAR, points out problems that may be encountered, suggests ways of avoiding the pitfalls and introduces several exciting, new QSAR methods discovered during the last decade.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein-DNA binding
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Havranek04,
  author  = "J.J. Havranek and C.M. Duarte and D. Baker",
  title   = "A simple physical model for the prediction and design of protein-{DNA} interactions",
  journal = "J Mol Biol",
  year    = "2004",
  volume  = "344",
  pages   = "59--70",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Molecular surfaces
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Connolly83,
  author  = "M.L. Connolly",
  title   = "Solvent-accessible surfaces of proteins and nucleic acids",
  journal = "Science",
  volume  = "221",
  pages   = "709--713",
  year    = "1983",
  comment = "This is the main reference for the Connolly surface",
}

@Article{Connolly83b,
  author  = "M. L. Connolly",
  title   = "Analytical Molecular Surface Calculation",
  journal = "Journal of Applied Crystallography",
  year    = "1983",
  volume  = "16",
  pages   = "548--558",
}

@Article{Connolly85,
  author  = "M.L. Connolly",
  title   = "Molecular surface triangulation",
  journal = "Journal of Applied Crystallography",
  volume  = "18",
  year    = "1985",
  pages   = "499--505",
}

@Article{Connolly86a,
  author  = "M.L. Connolly",
  title   = "Measurement of protein surface shape by solid angles",
  journal = "J. Mol. Graphics",
  volume  = "4",
  year    = "1986",
  pages   = "3--6",
}

@Article{Connolly86b,
  author  = "M.L. Connolly",
  title   = "Plotting protein surfaces",
  journal = "J. Mol. Graphics",
  volume  = "4",
  year    = "1986",
  pages   = "93--96",
}

@Article{Connolly93,
  author  = "M.L. Connolly",
  title   = "The molecular surface package",
  journal = "J. Mol.
Graphics",
  volume  = "11",
  year    = "1993",
  pages   = "139--141",
  comment = "http://www.biohedron.com/",
}

@Article{Sanner96,
  author  = "M.F. Sanner and J.C. Spehner and A.J. Olson",
  title   = "Reduced surface: an efficient way to compute molecular surfaces",
  journal = "Biopolymers",
  volume  = "38",
  number  = "3",
  year    = "1996",
  pages   = "305--320",
  comment = "http://www.scripps.edu/pub/olson-web/people/sanner/html/msms_home.html",
}

@Article{Eisenhaber93,
  author  = "F. Eisenhaber and P. Argos",
  title   = "Improved Strategy in Analytic Surface Calculation for Molecular Systems: Handling of Singularities and Computational Efficiency",
  journal = "Journal of Computational Chemistry",
  volume  = "14",
  number  = "11",
  year    = "1993",
  pages   = "1272--1280",
  comment = "http://mendel.imp.univie.ac.at/SURFACE/ASC/asc2.html",
}

@Article{Eisenhaber95,
  author  = "F. Eisenhaber and P. Lijnzaad and P. Argos and C. Sander and M. Scharf",
  title   = "The Double Cubic Lattice Method: Efficient approaches to numerical integration of surface area and volume and to dot surface contouring of molecular assemblies",
  journal = "Journal of Computational Chemistry",
  volume  = "16",
  number  = "3",
  year    = "1995",
  pages   = "273--284",
}

@Article{Lee71,
  author  = "B. Lee and F.M. Richards",
  title   = "The Interpretation of Protein Structures: Estimation of Static Accessibility",
  journal = "Journal of Molecular Biology",
  volume  = "55",
  year    = "1971",
  pages   = "379--400",
  comment = "This is the main reference for the solvent accessible surface",
}

@Article{Greer78,
  author  = "J. Greer and B. Bush",
  title   = "Macromolecular Shape and Surface Maps by Solvent Exclusion",
  journal = "Proceedings of the National Academy of Sciences USA",
  year    = "1978",
  volume  = "75",
  pages   = "303--307",
  comment = "Early method for computing solvent accessible surfaces",
}

@Article{ODonnell92,
  author  = "T.J.
O'Donnell",
  title   = "Interactive Computation and Display of Molecular Surfaces",
  journal = "Journal of Molecular Graphics",
  year    = "1992",
  volume  = "10",
  pages   = "39--40",
}

@Article{Klein90,
  author  = "T. Klein and C. Huang and E. Pettersen and G. Couch and T. Ferrin and R. Langridge",
  title   = "A Real-Time Malleable Molecular Surface",
  journal = "Journal of Molecular Graphics",
  volume  = "8",
  year    = "1990",
  pages   = "16--24, 26--27",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Secondary Structure Prediction
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Rost03,
  author  = "B. Rost",
  title   = "Prediction in {1D}: secondary structure, membrane helices, and accessibility",
  journal = "Methods Biochem. Anal.",
  volume  = "44",
  year    = "2003",
  pages   = "559--587",
}

% NOTE(review): the comment on Kabsch83 previously described DSSP as predicting secondary structure
% from sequence; per the paper's own title it works from hydrogen-bond and geometrical features.
@Article{Kabsch83,
  author  = "W. Kabsch and C. Sander",
  title   = "Dictionary of Protein Secondary Structure: Pattern Recognition of Hydrogen-Bonded and Geometrical Features",
  journal = "Biopolymers",
  volume  = "22",
  year    = "1983",
  pages   = "2577--2637",
  comment = "This is the paper about DSSP, a method for assigning secondary structure from the hydrogen-bonding and geometrical features of a known 3D structure",
}

@Article{Jones99,
  author  = "D.T. Jones",
  title   = "Protein secondary structure prediction based on position-specific scoring matrices",
  journal = "J. Mol. Biol.",
  volume  = 292,
  year    = 1999,
  pages   = "195--202",
  comment = "PSIPRED: One of the leading protein secondary structure prediction methods",
}

@Article{King96,
  author  = "R.D. King and M.J.E. Sternberg",
  title   = "Identification and application of the concepts important for accurate and reliable protein secondary structure prediction",
  journal = "Prot. Sci.",
  volume  = "5",
  year    = "1996",
  pages   = "2298--2310",
}

@Article{Garnier96,
  author  = "J. Garnier and J.F. Gibrat and B.
Robson",
  title   = "{GOR} method for predicting protein secondary structure from amino acid sequence",
  journal = "Methods Enzymol",
  volume  = "266",
  year    = "1996",
  pages   = "540--553",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Tertiary structure prediction overviews
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Schueler-Furman05,
  author   = "O. {Schueler-Furman} and C. Wang and P. Bradley and K. Misura and D. Baker",
  title    = "Progress in modeling of protein structures and interactions",
  journal  = "Science",
  volume   = "310",
  number   = "5748",
  pages    = "638--642",
  month    = oct,
  year     = "2005",
  url      = "http://depts.washington.edu/bakerpg/papers/SchuelerFurman-Science-v310-p638.pdf",
  abstract = "The prediction of the structures and interactions of biological macromolecules at the atomic level and the design of new structures and interactions are critical tests of our understanding of the interatomic interactions that underlie molecular biology. Equally important, the capability to accurately predict and design macromolecular structures and interactions would streamline the interpretation of genome sequence information and allow the creation of macromolecules with new and useful functions. This review summarizes recent progress in modeling that suggests that we are entering an era in which high-resolution prediction and design will make increasingly important contributions to biology and medicine.",
}

@Book{Sternberg97,
  author    = "M.J.E. Sternberg",
  title     = "Protein Structure Prediction - A practical approach",
  publisher = "Oxford University Press",
  year      = "1997",
  note      = "{ISBN:0199634963}",
  url       = "http://www.amazon.com/exec/obidos/tg/detail/-/0199634963/qid=1127051707/sr=1-1/ref=sr_1_1/104-9907891-5367125?v=glance&s=books",
}

@Article{Baker01,
  author  = "D. Baker and A.
Sali",
  title   = "Protein Structure Prediction and Structural Genomics",
  journal = "Science",
  volume  = "294",
  number  = "5540",
  year    = "2001",
  pages   = "93--96",
}

@Article{Jones00,
  author  = "D.T. Jones",
  title   = "Protein Structure Prediction in the Postgenomic Era",
  journal = "Current Opinion in Structural Biology",
  volume  = "10",
  number  = "3",
  month   = jun,
  year    = "2000",
  pages   = "371--379",
}

@Article{Simons01,
  author  = "K.T. Simons and C. Strauss and D. Baker",
  title   = "Prospects for ab initio Protein Structural Genomics",
  journal = "J. Molecular Biology",
  volume  = "306",
  number  = "5",
  year    = "2001",
  pages   = "1191--1199",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Tertiary structure prediction evaluations
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% NOTE(review): Moult03 had no year (a required field for an article entry); 2003 is taken from
% the citation key -- confirm against the journal issue.
@Article{Moult03,
  author   = "J. Moult and K. Fidelis and A. Zemla and T. Hubbard",
  title    = "Critical assessment of methods of protein structure prediction ({CASP}) - round {V}",
  journal  = "Proteins: Structure, Function, and Genetics",
  volume   = "53",
  number   = "S6",
  year     = "2003",
  pages    = "334--339",
  abstract = "This article provides an introduction to the special issue of the journal Proteins dedicated to the fifth CASP experiment to assess the state of the art in protein structure prediction. The article describes the conduct, the categories of prediction, and the evaluation and assessment procedures of the experiment. A brief summary of progress over the five CASP experiments is provided. Related developments in the field are also described.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Tertiary structure prediction with ab initio methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Floudas06,
  author  = "C.A. Floudas and H.K. Fung and S.R. McAllister and M. M{\"o}nnigmann and R. Rajgaria",
  title   = "Advances in Protein Structure Prediction and De Novo Protein Design: A review",
  journal = "Chem. Eng.
Sci.",
  year    = "2006",
  volume  = "61",
  pages   = "966--988",
  comment = "Review paper for protein structure prediction and de novo protein design.",
}

@Article{Klepeis02,
  author  = "J.L. Klepeis and C.A. Floudas",
  title   = "Ab initio prediction of helical segments in polypeptides",
  year    = "2002",
  journal = "J. Comput. Chem.",
  number  = "2",
  volume  = "23",
  pages   = "245--266",
  comment = "Method for predicting helical regions using detailed atomistic level modeling of overlapping oligopeptides.",
}

@Article{Klepeis03a,
  author  = "J.L. Klepeis and C.A. Floudas",
  title   = "Prediction of beta-sheet topology and disulfide bridges in polypeptides",
  journal = "J. Comput. Chem.",
  year    = "2003",
  volume  = "24",
  pages   = "191--208",
  comment = "Method for predicting beta-strand locations and beta-sheet topology using optimization techniques",
}

@Article{Klepeis03b,
  author  = "J.L. Klepeis and C.A. Floudas",
  title   = "{ASTRO-FOLD}: A Combinatorial and Global Optimization Framework for Ab Initio Prediction of Three-Dimensional Structures of Proteins from the Amino Acid Sequence",
  journal = "Biophys. J.",
  year    = "2003",
  volume  = 85,
  pages   = "2119--2146",
  comment = "First principles framework for protein structure prediction",
}

@Article{Monningmann05,
  author  = "M. M{\"o}nnigmann and C.A. Floudas",
  title   = "Protein Loop Structure Prediction With Flexible Stem Geometries",
  journal = "Prot. Struct. Funct. Bioinf.",
  year    = "2005",
  volume  = "61",
  pages   = "748--762",
  comment = "Loop structure prediction method for loops with flexible stems. Uses dihedral angle sampling and introduces a novel use of clustering.",
}

@Article{Liwo02,
  author  = "A. Liwo and P. Arlukowicz and C. Czaplewski and S. Oldziej and J. Pillardy and H.A.
Scheraga",
  title   = "A method for optimizing potential-energy functions by hierarchical design of the potential-energy landscape: Application to the {UNRES} force field",
  journal = "PNAS",
  year    = "2002",
  volume  = "99",
  pages   = "1937--1942",
  comment = "One of the more recent papers by Scheraga and co-workers detailing the use of the united residue (UNRES) approach for protein tertiary structure prediction",
}

@Article{Skolnick03,
  author  = "J. Skolnick and Y. Zhang and A. K. Arakaki and A. Kolinski and M. Boniecki and A. Szil{\'a}gyi and D. Kihara",
  title   = "{TOUCHSTONE}: A Unified Approach to Protein Structure Prediction",
  journal = "Prot. Struct. Funct. Bioinf.",
  year    = "2003",
  volume  = "53",
  pages   = "469--479",
}

@Article{Rohl04,
  author  = "C.A. Rohl and C.E. Strauss and K.M. Misura and D. Baker",
  title   = "Protein structure prediction using {Rosetta}",
  journal = "Methods Enzymol",
  volume  = "383",
  year    = "2004",
  pages   = "66--93",
  url     = "http://depts.washington.edu/bakerpg/papers/Rohl-MethEnz-v383-p66.pdf",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Tertiary structure prediction with x-ray crystallography
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{David03,
  author  = "A.M. Davis and S.J. Teague and G.J. Kleywegt",
  title   = "Application and limitations of {X-ray} crystallographic data in structure-based ligand and drug design",
  journal = "Angew. Chem., Int. Ed.",
  volume  = "42",
  year    = "2003",
  pages   = "2718--2736",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Tertiary structure prediction with homology modeling (comparative modeling)
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% NOTE(review): this is a chapter in a book (it carried a publisher and a book title in the journal
% field), so it is typed as InCollection with booktitle/publisher/address. Key unchanged.
@InCollection{Madhusudhan05,
  author    = "M.S. Madhusudhan and M.A. Marti-Renom and N. Eswar and B. John and U. Pieper and R. Karchin and M.-Y. Shen and A. Sali",
  title     = "Comparative protein structure modeling",
  booktitle = "The Proteomics Protocols Handbook",
  publisher = "Humana Press",
  address   = "Totowa, NJ",
  year      = "2005",
  pages     = "831--860",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Tertiary structure prediction with threading (fold recognition)
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Godzik03,
  author  = "A. Godzik",
  title   = "Fold recognition methods",
  journal = "Methods Biochem. Anal.",
  volume  = "44",
  year    = "2003",
  pages   = "525--546",
}

@Article{Lathrop94,
  author  = "R.H. Lathrop",
  title   = "The protein threading problem with sequence amino acid interaction preferences is {NP}-complete",
  journal = "Protein Eng",
  volume  = "7",
  number  = "9",
  year    = "1994",
  pages   = "1059--1068",
}

@Article{Xu03,
  author  = "J. Xu and M. Li and D. Kim and Y. Xu",
  title   = "{RAPTOR}: Optimal Protein Threading by Linear Programming",
  journal = "J. Bioinf. Comput. Biol.",
  year    = "2003",
  volume  = "1",
  pages   = "95--117",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Tertiary structure prediction with hybrid methods
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% NOTE(review): book chapter (publisher given, book title was in the journal field); typed as
% InCollection. The volume number is presumably the volume of the book series -- confirm.
@InCollection{Alber04,
  author    = "F. Alber and N. Eswar and A. Sali",
  title     = "Structure determination of macromolecular complexes by experiment and computation",
  booktitle = "Practical Bioinformatics",
  volume    = "15",
  publisher = "Springer",
  address   = "New York",
  year      = "2004",
  pages     = "73--96",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein structure evaluation
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Eyal05,
  author  = "E. Eyal and S. Gerzon and V. Potapov and M. Edelman and V. Sobolev",
  title   = "The Limit of Accuracy of Protein Modeling: Influence of Crystal Packing on Protein Structure",
  journal = "J.
Mol. Biol.",
  volume = "351",
  year = "2005",
  pages = "431-442",
  abstract = "The size of the protein database (PDB) makes it now feasible to arrive at statistical conclusions regarding structural effects of crystal packing. These effects are relevant for setting upper practical limits of accuracy on protein modeling. Proteins whose crystals have more than one molecule in the asymmetric unit or whose structures were determined at least twice by X-ray crystallography were paired and their differences analyzed. We demonstrate a clear influence of crystal environment on protein structure, including backbone conformations, hinge-like motions and side-chain conformations. The positions of surface water molecules tend to be variable in different crystal environments while those of ligands are not. Structures determined by independent groups vary more than structures determined by the same authors. The use of different refinement methods is a major source for this effect. Our pair-wise analysis derives a practical limit to the accuracy of protein modeling. For different crystal forms, the limit of accuracy (C$\alpha$, root-mean-square deviation (RMSD)) is $\sim$0.8 {\AA} for the entire protein, which includes $\sim$0.3 {\AA} due to crystal packing. For organized secondary elements, the upper limit of C$\alpha$ RMSD is 0.5--0.6 {\AA} while for loops or protein surface it reaches 1.0 {\AA}. Twenty percent of exposed sidechains exhibit different $\chi_{1+2}$ conformations with approximately half of the effect also resulting from crystal packing. A web based tool for analysis and graphic presentation of surface areas of crystal contacts is available (http://ligin.weizmann.ac.il/cryco).",
}

@Article{Wei99,
  author = "L. Wei and E.S. Huang and R.B. Altman",
  title = "Are predicted structures good enough to preserve functional sites?",
  journal = "Structure Fold Des",
  year = "1999",
  volume = "7",
  number = "6",
  pages = "643-650",
  comment = "``BACKGROUND: A principal goal of structure prediction is the elucidation of function.
We have studied the ability of computed models to preserve the microenvironments of functional sites. In particular, 653 model structures of a calcium-binding protein (generated using an ab initio folding protocol) were analyzed, and the degree to which calcium-binding sites were recognizable was assessed. RESULTS: While some model structures preserve the calcium-binding microenvironments, many others, including some with low root mean square deviations (rmsds) from the crystal structure of the native protein, do not. There is a very weak correlation between the overall rmsd of a structure and the preservation of calcium-binding sites. Only when the quality of the model structure is high (rmsd less than 2 {\AA} for atoms in the 7 {\AA} local neighborhood around calcium) does the modeling of the binding sites become reliable. CONCLUSIONS: Protein structure prediction methods need to be assessed in terms of their preservation of functional sites. High-resolution structures are necessary for identifying binding sites such as calcium-binding sites.''",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Cryo-EM structures
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Chiu05,
  author = "W. Chiu and M.L. Baker and W. Jiang and M. Dougherty and M.F. Schmid",
  title = "Electron cryomicroscopy of biological machines at subnanometer resolution",
  journal = "Structure",
  volume = "13",
  year = "2005",
  pages = "363-372",
}

@Article{Frank02,
  author = "J. Frank",
  title = "Single-particle imaging of macromolecules by cryo-electron microscopy",
  journal = "Annu. Rev. Biophys. Biomol. Struct.",
  volume = "31",
  year = "2002",
  pages = "303-319",
}

% NOTE(review): the fields below had no entry header, so BibTeX skipped the
% whole reference. The header was restored with key Kuhn02, following the
% LastnameYY convention of the neighbouring keys; confirm that this key is
% not already defined elsewhere and that the entry was not disabled on purpose.
@Article{Kuhn02,
  author = "R.J. Kuhn and W. Zhang and M.G. Rossmann and S.V. Pletnev and J. Corver and E. Lenches and C.T. Jones and S. Mukhopadhyay and P.R. Chipman and E.G.
Strauss",
  title = "Structure of dengue virus: implications for flavivirus organization, maturation, and fusion",
  journal = "Cell",
  volume = "108",
  year = "2002",
  pages = "717-725",
  comment = "Fitting rigid x-ray structures into cryo-em map",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Prediction of protein side-chain rotamers
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

% NOTE(review): J. Mol. Biol. volume 267 appeared in 1997, so the year was
% corrected from 1999 and the second author from Cowen to Cohen; the key
% Bower99 is kept so existing citations keep resolving. Confirm against the paper.
@Article{Bower99,
  author = "M. J. Bower and F.E. Cohen and R.L. Dunbrack",
  title = "Prediction of protein side-chain rotamers from a backbone-dependent rotamer library: a new homology modeling tool",
  journal = "J. Mol. Biol.",
  year = "1997",
  volume = "267",
  pages = "1268-1282",
  comment = "This is a reference for the Dunbrack rotamer library",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Analysis of residue conservation
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Mayrose04,
  author = "I. Mayrose and D. Graur and N. Ben-Tal and T. Pupko",
  year = "2004",
  title = "Comparison of site-specific rate-inference methods for protein sequences: {Bayesian} methods are superior",
  journal = "Mol Biol Evol",
  volume = "21",
  pages = "1781-1791",
}

@Article{Glaser05,
  author = "F. Glaser and Y. Rosenberg and A. Kessel and T. Pupko and N. {Ben-Tal}",
  year = "2005",
  title = "The {ConSurf-HSSP} database: The mapping of evolutionary conservation among homologs onto {PDB} structures",
  journal = "PROTEINS: Structure, Function, and Bioinformatics",
  volume = "58",
  pages = "610-617",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Protein design
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Baker06,
  author = "D.
Baker",
  title = "Prediction and design of macromolecular structures and interactions",
  journal = "Philos Trans R Soc Lond B Biol Sci.",
  volume = "361",
  number = "1467",
  year = "2006",
  pages = "459-463",
}

@Article{Kuhlman03,
  title = "Design of a Novel Globular Protein Fold with Atomic-Level Accuracy",
  author = "B. Kuhlman and G. Dantas and G.C. Ireton and G. Varani and B.L. Stoddard and D. Baker",
  journal = "Science",
  volume = "302",
  number = "5649",
  month = nov,
  year = "2003",
  pages = "1364-1368",
  url = "http://www.sciencemag.org/cgi/content/full/302/5649/1364",
  abstract = "A major challenge of computational protein design is the creation of novel proteins with arbitrarily chosen three-dimensional structures. Here, we used a general computational strategy that iterates between sequence design and structure prediction to design a 93-residue $\alpha$/$\beta$ protein called Top7 with a novel sequence and topology. Top7 was found experimentally to be folded and extremely stable, and the x-ray crystal structure of Top7 is similar (root mean square deviation equals 1.2 angstroms) to the design model. The ability to design a new protein fold makes possible the exploration of the large regions of the protein universe not yet observed in nature.",
}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Not classified yet
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

@Article{Aloy01,
  author = "P. Aloy and E. Querol and F.X. Aviles and M.J.E. Sternberg",
  title = "Automated structure-based prediction of functional sites in proteins: applications to assessing the validity of inheriting protein function from homology in genome annotation and to protein docking",
  year = "2001",
  journal = "J. Mol. Biol.",
  volume = "311",
  pages = "395-408",
}

% The first author's two-word surname is braced and given in "Last, First"
% form so that BibTeX does not take "Eyck" alone as the surname.
@InProceedings{TenEyck95,
  author = "{Ten Eyck}, L.F. and J. Mandell and V.A. Roberts and M.E.
Pique",
  title = "Surveying molecular interactions with {DOT}",
  booktitle = "1995 ACM/IEEE Supercomputing Conference",
  location = "New York",
  year = "1995",
}

@Article{Zhang05,
  author = "Y. Zhang and J. Skolnick",
  title = "The protein structure prediction problem could be solved using the current {PDB} library",
  journal = "PNAS",
  volume = "102",
  number = "4",
  year = "2005",
  pages = "1029-1034",
}

@Article{Glick02,
  author = "M. Glick and D.D. Robinson and G.H. Grant and W.G. Richards",
  title = "Identification of ligand binding sites on proteins using a multiscale approach",
  journal = "J. Am. Chem. Soc.",
  year = "2002",
  volume = "124",
  pages = "2337-2344",
}

@Article{Todd02,
  author = "A.E. Todd and C.A. Orengo and J.M. Thornton",
  title = "Plasticity of enzyme active sites",
  journal = "Trends in Biochemical Sciences",
  volume = "27",
  year = "2002",
  pages = "419-426",
  comment = "The expectation is that any similarity in reaction chemistry shared by enzyme homologues is mediated by common functional groups conserved through evolution. However, detailed enzyme studies have revealed the flexibility of many active sites, in that different functional groups, unconserved with respect to position in the primary sequence, mediate the same mechanistic role. Nevertheless, the catalytic atoms might be spatially equivalent. More rarely, the active sites have completely different locations in the protein scaffold.
This variability could result from: (1) the hopping of functional groups from one position to another to optimize catalysis; (2) the independent specialization of a low-activity primordial enzyme in different phylogenetic lineages; (3) functional convergence after evolutionary divergence; or (4) circular permutation events.",
}

@Article{Pearl93,
  author = "L. Pearl",
  title = "Similarity Of Active-Site Structures",
  journal = "Nature",
  volume = "362",
  year = "1993",
  pages = "24",
  comment = "This paper observes the similarities in the active sites of serine proteases",
}

@Article{Carlson02,
  author = "H.A. Carlson",
  title = "Protein Flexibility is an Important Component of Structure-Based Drug Discovery",
  journal = "Current Pharmaceutical Design",
  volume = "8",
  number = "17",
  year = "2002",
  pages = "1571-1578",
  abstract = "Receptor-based drug discovery can increase the novelty of a hit list over ligand-based models that are dependent on known inhibitors. It is important to explore new conformational and chemical space, but it is difficult to predict the plasticity of the binding site. Receptor-based methods are usually based on crystal structures of ligand-protein complexes, and hit lists can be restricted to the size and shape of the receptor model. Many improvements that accommodate protein flexibility in computer-aided drug design are being developed. These methods are reviewed with the focus being techniques that move beyond the rotation of side chains. The use of multiple protein structures is emerging as the best choice for including more realistic changes in protein conformation, but the optimal way to using these structures is still unclear.",
}

@Article{Betz02,
  author = "S.F. Betz and S.M. Baxter and J.S.
Fetrow",
  title = "Function first: a powerful approach to post-genomic drug discovery",
  journal = "Drug Discovery Today",
  volume = "7",
  number = "16",
  month = aug,
  year = "2002",
  abstract = "In the post-genomic era, pharmaceutical researchers must evaluate vast numbers of protein sequences and formulate novel, intelligent strategies for identifying valid targets and discovering leads against them. The identification of small molecules that selectively target proteins or protein families will be aided by knowing the function and/or the structure of the target(s). By identifying protein function first, efficiencies are gained that allow subsequent focus of resources on particular protein families of interest. This article reviews current proteomic-scale approaches to identifying function as a way of accelerating lead discovery.",
}

@Article{Xie05,
  author = "L. Xie and P.E. Bourne",
  title = "Functional Coverage of the Human Genome by Existing Structures, Structural Genomics Targets and Homology Models",
  journal = "PLoS Comp Biol",
  volume = "1",
  number = "3",
  year = "2005",
  pages = "e31",
  abstract = "The sequencing of the human genome provides biologists with new opportunities to understand the molecular basis of physiological processes and disease states. To take full advantage of these opportunities the three-dimensional structure of the gene products are needed to provide the appropriate level of detail. Since protein structure determination lags behind protein sequence determination an important and on-going question becomes, what degree of coverage of the human proteome do we have from experimental structures and what can we infer by modeling? Or turning the question around, what structures do we need to determine (the most wanted list) to further our understanding of the human condition?
This paper addresses these questions through integration of existing data resources correlated using comparative functional features, namely the gene ontology (GO) describing biochemical process, molecular function and cellular location for all types of proteins and the Enzyme Commission (EC) classification for enzymes. Genetic disease states are linked through the On-line Mendelian Inheritance in Man (OMIM) resource. The reader can ask their own questions of the resource at http://function.rcsb.org:8080/pdb/function_distribution/index.html. The resource should prove particularly useful to the structural genomics community as they strive to undertake large-scale structure determination with a goal of improving our understanding of protein functional space.",
}

@Article{Nikolova04,
  author = "N. Nikolova and J. Jaworska",
  title = "Approaches to measure chemical similarity - A review",
  journal = "QSAR Comb. Sci.",
  year = "2004",
  volume = "22",
  pages = "1006-1026",
}

@Article{Hert04,
  author = "J. Hert and P. Willett and D.J. Wilton",
  title = "Comparison of fingerprint-based methods for virtual screening using multiple bioactive reference structures",
  journal = "J. Chem. Inf. Comput. Sci.",
  year = "2004",
  volume = "44",
  pages = "1177-1185",
}

@Article{Gelly06,
  author = "J. Gelly and A.G. {de Brevern} and S. Hazout",
  title = "{Protein Peeling:} an approach for splitting a {3D} protein structure into compact fragments",
  journal = "Bioinformatics",
  volume = "22",
  number = "2",
  year = "2006",
  pages = "129-133",
  abstract = "Motivation: The object of this study is to propose a new method to identify small compact units that compose protein three-dimensional structures. These fragments, called `protein units (PU)', are a new level of description to well understand and analyze the organization of protein structures. The method only works from the contact probability matrix, i.e. the inter C$\alpha$-distances translated into probabilities.
It uses the principle of conventional hierarchical clustering, leading to a series of nested partitions of the 3D structure. Every step aims at dividing optimally a unit into 2 or 3 subunits according to a criterion called `partition index' assessing the structural independence of the subunits newly defined. Moreover, an entropy-derived squared correlation R is used for assessing globally the protein structure dissection. The method is compared to other splitting algorithms and shows relevant performance. Availability: An Internet server with dedicated tools is available at http://www.ebgm.jussieu.fr/~gelly/ Contact: debrevern@ebgm.jussieu.fr.",
}