@inproceedings{73b06c77c1334a2a87f06d8d6f2ba563,
title = "The Role of Hydrophobicity in Peptide-MHC Binding",
abstract = "Major Histocompability Complex (MHC) Class I molecules provide a pathway for cells to present endogenous peptides to the immune system, allowing it to distinguish healthy cells from those infected by pathogens. Software tools based on neural networks such as NetMHC and NetMHCpan predict whether peptides will bind to variants of MHC molecules. These tools are trained with experimental data, consisting of the amino acid sequence of peptides and their observed binding strength. Such tools generally do not explicitly consider hydrophobicity, a significant biochemical factor relevant to peptide binding. It was observed that these tools predict that some highly hydrophobic peptides will be strong binders, which biochemical factors suggest is incorrect. This paper investigates the correlation of the hydrophobicity of 9-mer peptides with their predicted binding strength to the MHC variant HLA-A*0201 for these software tools. Two studies were performed, one using the data that the neural networks were trained on and the other using a sample of the human proteome. A significant bias within NetMHC-4.0 towards predicting highly hydrophobic peptides as strong binders was observed in both studies. This suggests that hydrophobicity should be included in the training data of the neural networks. Retraining the neural networks with such biochemical annotations of hydrophobicity could increase the accuracy of their predictions, increasing their impact in applications such as vaccine design and neoantigen identification.",
keywords = "MHC Class I, Machine learning, Neural networks, Peptide",
author = "Arnav Solanki and Marc Riedel and James Cornette and Julia Udell and Ishaan Koratkar and George Vasmatzis",
note = "Funding Information: Supported by NSF Grant 2036064. Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; 3rd International Symposium on Mathematical and Computational Oncology, ISMCO 2021 ; Conference date: 11-10-2021 Through 13-10-2021",
year = "2021",
doi = "10.1007/978-3-030-91241-3_3",
language = "English (US)",
isbn = "9783030912406",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "24--37",
editor = "George Bebis and Terry Gaasterland and Mamoru Kato and Mohammad Kohandel and Kathleen Wilkie",
booktitle = "Mathematical and Computational Oncology - Third International Symposium, ISMCO 2021, Proceedings",
}