@comment{
  SPEAR conference paper, BCB 2021 proceedings.
  Review notes:
  - The citation key is kept unchanged so existing citations keep resolving.
  - month/day record 18 Jan 2021, while the annote field lists the conference
    dates as 01-08-2021 through 04-08-2021; confirm which date is intended.
  - Funding, copyright and event details live in annote (not note) so that
    standard styles do not print them in the reference list.
  - SPEAR is brace-protected in the title so sentence-casing styles keep it
    in capitals.
}
@inproceedings{5c101abd5baf4acea466ec5ad9e426a4,
  author    = {Fu, Tianfan and Xiao, Cao and Huang, Kexin and Glass, Lucas M. and Sun, Jimeng},
  title     = {{SPEAR}: Self-supervised post-training enhancer for molecule optimization},
  booktitle = {Proceedings of the 12th ACM Conference on Bioinformatics, Computational Biology, and Health Informatics, BCB 2021},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2021},
  month     = jan,
  day       = {18},
  doi       = {10.1145/3459930.3469530},
  keywords  = {drug discovery, healthcare, molecule optimization},
  language  = {English (US)},
  abstract  = {The molecular optimization task is to generate molecules that are similar to a target molecule but with better chemical properties. Deep Generative Models (DGMs) have shown initial success in automatic molecule optimization. However, the training of DGMs often suffers from limited labeled molecule pairs due to the ad-hoc and restricted molecule pair construction. To solve this challenge and leverage the entire unpaired molecule database, we propose Self-Supervised Post-training EnhAnceR method (SPEAR) to enhance any graph-based DGMs for molecule optimization. SPEAR mines molecular structure knowledge and learns the molecule generation procedure in a purely self-supervised fashion. Unlike most self-supervised deep learning models that rely on pre-training for better molecule representation, the SPEAR method is applied as post-processing step to enhance molecule optimization during inference time for DGMs without additional training. Our SPEAR model can be efficiently incorporated into any DGM model as part of the inference procedure. We evaluated SPEAR against several state-of-the-art DGMs, SPEAR successfully improved the performance of all DGMs and obtained 5--21\% relative improvement over its corresponding DGM models in terms of success rate.},
  annote    = {Funding Information: This work was in part supported by the National Science Foundation award SCH-2014438, PPoSS 2028839, IIS-1838042, the National Institute of Health award NIH R01 1R01NS107291-01 and OSF Healthcare. Publisher Copyright: {\textcopyright} 2021 Owner/Author.; 12th ACM Conference on Bioinformatics, Computational Biology, and Health Informatics, BCB 2021 ; Conference date: 01-08-2021 Through 04-08-2021},
}