@article{d56eadcdb27f403793e670f4cdfa2ec9,
title = "Physicochemical graph neural network for learning protein–ligand interaction fingerprints from sequence data",
abstract = "In drug discovery, determining the binding affinity and functional effects of small-molecule ligands on proteins is critical. Current computational methods can predict these protein–ligand interaction properties but often lose accuracy without high-resolution protein structures and falter in predicting functional effects. Here we introduce PSICHIC (PhySIcoCHemICal graph neural network), a framework incorporating physicochemical constraints to decode interaction fingerprints directly from sequence data alone. This enables PSICHIC to attain capabilities in decoding mechanisms underlying protein–ligand interactions, achieving state-of-the-art accuracy and interpretability. Trained on identical protein–ligand pairs without structural data, PSICHIC matched and even surpassed leading structure-based methods in binding-affinity prediction. In an experimental library screening for adenosine A1 receptor agonists, PSICHIC discerned functional effects effectively, ranking the sole novel agonist within the top three. PSICHIC{\textquoteright}s interpretable fingerprints identified protein residues and ligand atoms involved in interactions, and helped in unveiling selectivity determinants of protein–ligand interaction. We foresee PSICHIC reshaping virtual screening and deepening our understanding of protein–ligand interactions.",
author = "Koh, \{Huan Yee\} and Nguyen, \{Anh T.N.\} and Shirui Pan and May, \{Lauren T.\} and Webb, \{Geoffrey I.\}",
note = "Funding Information: Research on adenosine receptor signalling was supported by a National Heart Foundation Future Leader Fellowship (101857 to L.T.M.), National Health and Medical Research Council (NHMRC) of Australia Ideas grant (APP2013629 to L.T.M., G.I.W. and A.T.N.N.) and a Department of Health and Aged Care (MRFF) Stem Cell Therapies Mission grant (MRF2015957 to L.T.M. and A.T.N.N.). H.Y.K.\textbackslash{}u2019s scholarship is supported by the Australian Government Research Training Program (RTP) Scholarship and the Australian Research Council under grant ARC DP210100072. High-throughput screening was performed at the National Drug Discovery Centre, WEHI, Parkville, Australia, with support from the Australian Government Medical Research Future Fund (MRFF). Our acknowledgement extends to Cortellis Drug Discovery Intelligence for granting public access to the curated functional effect dataset, and to BioRender for the display elements used in our figures, which were created using BioRender.com . Special thanks to Monash Institute of Pharmaceutical Sciences (MIPS) Monash University for access to the MIPS library, in particular P. Sexton and A. Christopoulos for purchase of the MIPS library and to J. Baell for the design of the library. We thank C. S. Lu for assistance with pharmacological evaluation. Computational resources were generously provided by the Nectar Research Cloud, a collaborative Australian research platform supported by the NCRIS-funded Australian Research Data Commons (ARDC) and the MASSIVE HPC facility. We extend our sincere gratitude to B. K. Koh, H. J. W. Koh and Y. Li for their invaluable feedback on paper writing and figures. Publisher Copyright: {\textcopyright} The Author(s), under exclusive licence to Springer Nature Limited 2024.",
year = "2024",
month = jun,
doi = "10.1038/s42256-024-00847-1",
language = "English",
volume = "6",
pages = "673–687",
journal = "Nature Machine Intelligence",
issn = "2522-5839",
publisher = "Nature Publishing Group",
}