Yago Ferreira e Silva, Harold Hilarion Fokoue and Paulo Ricardo Batista*,
{"title":"","authors":"Yago Ferreira e Silva, Harold Hilarion Fokoue and Paulo Ricardo Batista*, ","doi":"","DOIUrl":"","url":null,"abstract":"","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"65 14","pages":"XXX-XXX XXX-XXX"},"PeriodicalIF":5.6,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://pubs.acs.org/doi/pdf/10.1021/acs.jcim.5c00990","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144712754","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"OA","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"MutPNI: A Unified Model Architecture for Accurately Predicting the Effects of Mutations on Protein-Nucleic Acid Interactions.","authors":"Zihao Yan,Fang Ge,Ying Zhang,He Yan,Yan Liu,Yi-Heng Zhu,Jiangning Song,Dong-Jun Yu","doi":"10.1021/acs.jcim.5c00756","DOIUrl":"https://doi.org/10.1021/acs.jcim.5c00756","url":null,"abstract":"Missense mutations in DNA- and RNA-binding proteins can disrupt vital interaction networks and frequently lead to disease. However, current methods for predicting changes in binding affinity between protein-DNA and protein-RNA remain fragmented and inefficient. In this study, we introduce MutPNI, a novel general regression model that predicts the effects of missense mutations in DNA-binding and RNA-binding proteins. To achieve this, we integrate feature embeddings from pretrained ESM-2 and ProtT5 protein language models and incorporate energy terms derived from mutant protein structures. We then train the model through a Transformer-based encoder, enabling it to attain PCC values of 0.661 and 0.701 on DNA and RNA benchmark test sets, respectively. Furthermore, our final strategy relies on the same model architecture, rather than identical parameters, to predict mutations in both protein-DNA and protein-RNA complexes, thereby highlighting shared features as well as key distinctions in the two data sets. Finally, the method's high computational efficiency allows for scaling to large biological data sets, offering a robust platform for future research. The web server and data sets for MutPNI are publicly available at https://csbioinformatics.njust.edu.cn/mutpni/ for academic use.","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"57 1","pages":""},"PeriodicalIF":5.6,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144720042","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"","authors":"","doi":"","DOIUrl":"","url":null,"abstract":"","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"65 14","pages":"XXX-XXX XXX-XXX"},"PeriodicalIF":5.6,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://pubs.acs.org/doi/pdf/10.1021/civ065i014_1964701","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144712726","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"OA","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"","authors":"Dinesh Kumar Jagannathareddy, and , Durba Roy*, ","doi":"","DOIUrl":"","url":null,"abstract":"","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"65 14","pages":"XXX-XXX XXX-XXX"},"PeriodicalIF":5.6,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://pubs.acs.org/doi/pdf/10.1021/acs.jcim.5c00686","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144712729","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"OA","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Hassan Ayaz, Asia Nawaz, Sajjad Ahmad, Faisal Ahmad*, Anisa Tariq, Hanbal Ahmad Khan, Iftikhar Ahmed, Sidra Rahman, Muhammad Suleman, Dilber Uzun Ozsahin, Ilker Ozsahin and Yasir Waheed*,
{"title":"","authors":"Hassan Ayaz, Asia Nawaz, Sajjad Ahmad, Faisal Ahmad*, Anisa Tariq, Hanbal Ahmad Khan, Iftikhar Ahmed, Sidra Rahman, Muhammad Suleman, Dilber Uzun Ozsahin, Ilker Ozsahin and Yasir Waheed*, ","doi":"","DOIUrl":"","url":null,"abstract":"","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"65 14","pages":"XXX-XXX XXX-XXX"},"PeriodicalIF":5.6,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://pubs.acs.org/doi/pdf/10.1021/acs.jcim.4c01652","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144712730","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"OA","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Patryk Tajs, Mateusz Skarupski and Jakub Rydzewski*,
{"title":"","authors":"Patryk Tajs, Mateusz Skarupski and Jakub Rydzewski*, ","doi":"","DOIUrl":"","url":null,"abstract":"","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"65 14","pages":"XXX-XXX XXX-XXX"},"PeriodicalIF":5.6,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://pubs.acs.org/doi/pdf/10.1021/acs.jcim.5c01107","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144712737","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"OA","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Clauber Henrique Souza da Costa, Camila Auad Beltrão de Freitas, Alberto Monteiro dos Santos, Carlos Gabriel da Silva de Souza, José Rogério A. Silva, Jerônimo Lameira, Vicent Moliner and Munir S. Skaf*,
{"title":"","authors":"Clauber Henrique Souza da Costa, Camila Auad Beltrão de Freitas, Alberto Monteiro dos Santos, Carlos Gabriel da Silva de Souza, José Rogério A. Silva, Jerônimo Lameira, Vicent Moliner and Munir S. Skaf*, ","doi":"","DOIUrl":"","url":null,"abstract":"","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"65 14","pages":"XXX-XXX XXX-XXX"},"PeriodicalIF":5.6,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://pubs.acs.org/doi/pdf/10.1021/acs.jcim.5c00308","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144712746","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"OA","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Sofiia A Dymura, Oleksandr O Viniichuk, Kostiantyn P Melnykov, Dmytro S Radchenko, Oleksandr O Grygorenko
{"title":"Machine Learning-Based Retention Time Prediction Tool for Routine LC-MS Data Analysis.","authors":"Sofiia A Dymura, Oleksandr O Viniichuk, Kostiantyn P Melnykov, Dmytro S Radchenko, Oleksandr O Grygorenko","doi":"10.1021/acs.jcim.5c00514","DOIUrl":"10.1021/acs.jcim.5c00514","url":null,"abstract":"<p><p>Accurate retention time (<i>R</i><sub>T</sub>) prediction models can significantly improve liquid chromatography-mass spectrometry (LC-MS) data analysis widely used in chemical synthesis. As hundreds of thousands of syntheses are performed annually at Enamine, a large amount of experimental data has been generated internally. In this paper, we present the development of an <i>R</i><sub>T</sub> prediction model based on the GATv2Conv + DL graph neural network (NN) architecture, trained on the internal data and further evaluated using the METLIN SMRT data set. The final model achieved a mean absolute error (MAE) of 2.48 s for the 120 s LC-MS method. We also conducted a detailed analysis of <i>R</i><sub>T</sub> prediction errors and determined that the interval between <i>R</i><sub>T</sub> - 7.12 s and <i>R</i><sub>T</sub> + 9.58 s contained over 95% of the data. The developed model has been successfully integrated into the existing in-house LC-MS analysis toolkit, enhancing its predictive and analytical capabilities. Additionally, we have published a curated subset of 20,000 data points from our internal data set to support community benchmarking and further research.</p>","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":" ","pages":"7415-7425"},"PeriodicalIF":5.3,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144641241","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Rıza Özçelik, Helena Brinkmann, Emanuele Criscuolo, Francesca Grisoni
{"title":"Generative Deep Learning for de Novo Drug Design─A Chemical Space Odyssey.","authors":"Rıza Özçelik, Helena Brinkmann, Emanuele Criscuolo, Francesca Grisoni","doi":"10.1021/acs.jcim.5c00641","DOIUrl":"10.1021/acs.jcim.5c00641","url":null,"abstract":"<p><p>In recent years, generative deep learning has emerged as a transformative approach in drug design, promising to explore the vast chemical space and generate novel molecules with desired biological properties. This perspective examines the challenges and opportunities of applying generative models to drug discovery, focusing on the intricate tasks related to small molecule generation, evaluation, and prioritization. Central to this process is navigating conflicting information from diverse sources─balancing chemical diversity, synthesizability, and bioactivity. We discuss the current state of generative methods, their optimization, and the critical need for robust evaluation protocols. By mapping this evolving landscape, we outline key building blocks, inherent dilemmas, and future directions in the journey to fully harness generative deep learning in the \"chemical odyssey\" of drug design.</p>","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":" ","pages":"7352-7372"},"PeriodicalIF":5.3,"publicationDate":"2025-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC12308806/pdf/","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144598911","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"OA","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Bingjia Yang,Yunsie Chung,Archer Y Yang,Bo Yuan,Tianchi Chen,Xiang Yu
{"title":"QComp: A QSAR-Based Imputation Framework for Drug Discovery.","authors":"Bingjia Yang,Yunsie Chung,Archer Y Yang,Bo Yuan,Tianchi Chen,Xiang Yu","doi":"10.1021/acs.jcim.5c00059","DOIUrl":"https://doi.org/10.1021/acs.jcim.5c00059","url":null,"abstract":"In drug discovery, in vitro and in vivo experiments generate biochemical activity data that are crucial for evaluating the efficacy and toxicity of compounds. These data sets are massive, sparse, and ever-evolving. Quantitative structure-activity relationship (QSAR) models, which predict biochemical activities from compound structures, face challenges in integrating the evolving experimental data agilely as studies progress. We developed QSAR-Complete (QComp), an imputation framework, to address these challenges. While QSAR models are updated at a slow pace through extensive retraining on enlarging data sets, QComp leverages existing QSAR models to immediately exploit new experimental data and improves the imputation of missing data. We demonstrate that the improvement is robust and substantial for imputing in vivo assays with only in vitro experimental data. Additionally, QComp assists in finding the optimal sequence of experiments by quantifying the reduction in statistical uncertainty for specific end points, aiding in rational decision-making throughout the drug discovery process.","PeriodicalId":44,"journal":{"name":"Journal of Chemical Information and Modeling ","volume":"27 1","pages":""},"PeriodicalIF":5.6,"publicationDate":"2025-07-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"144720043","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":2,"RegionCategory":"化学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}