% Conference paper, ACM BCB 2020 (auto-exported record, cleaned up by hand).
% Changes relative to the raw export:
%   - abstract: repaired garbled casing in hyphenated words (pre-trains, state-of-the-art, ...)
%   - note: escaped the literal '#' characters, which otherwise break LaTeX when the note is typeset
%   - series: dropped, it was a verbatim copy of booktitle and would be printed twice
%   - address: publisher location instead of a bare country name
%   - author: unambiguous "Last, First" form
% NOTE(review): the DOI prefix 10.1101 belongs to Cold Spring Harbor Laboratory (bioRxiv), so this
% DOI presumably resolves to the preprint rather than the ACM proceedings version -- TODO confirm
% and replace with the proceedings DOI if the published version is the one being cited.
@inproceedings{1acc8648adf84071b78291b7c5a07f29,
  author    = {Nambiar, Ananthan and Heflin, Maeve and Liu, Simon and Maslov, Sergei and Hopkins, Mark and Ritz, Anna},
  title     = {Transforming the Language of Life: {Transformer} Neural Networks for Protein Prediction Tasks},
  booktitle = {Proceedings of the 11th {ACM} International Conference on Bioinformatics, Computational Biology and Health Informatics, {BCB} 2020},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2020},
  month     = sep,
  day       = {21},
  doi       = {10.1101/2020.06.15.153643},
  language  = {English (US)},
  keywords  = {Neural networks, protein family classification, protein-protein interaction prediction, COVID-19},
  abstract  = {The scientific community is rapidly generating protein sequence information, but only a fraction of these proteins can be experimentally characterized. While promising deep learning approaches for protein prediction tasks have emerged, they have computational limitations or are designed to solve a specific task. We present a Transformer neural network that pre-trains task-agnostic sequence representations. This model is fine-tuned to solve two different protein prediction tasks: protein family classification and protein interaction prediction. Our method is comparable to existing state-of-the-art approaches for protein family classification while being much more general than other architectures. Further, our method outperforms all other approaches for protein interaction prediction. These results offer a promising framework for fine-tuning the pre-trained sequence representations for other protein prediction tasks.},
  note      = {Funding Information: This work has been supported by the National Science Foundation (awards \#1750981 and \#1725729). This work has also been partially supported by the Google Cloud Platform research credits program (to AR, MH, and AN). AN would like to thank Mark Bedau, Norman Packard and the Reed College Artificial Life Lab for insightful discussions and Desiree Odgers for inspiring the idea of taking a linguistic approach to a biological problem.; 11th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics, BCB 2020 ; Conference date: 21-09-2020 Through 24-09-2020},
}