@inproceedings{9f5bc2fb465249f29c9bdaabbc487a09,
title = "A machine learning approach for predicting Antibody Properties",
abstract = "This paper used an amino acid location-based sequence encoding as a feature extraction techniques to identify single chains antibody molecules that bind to B-lymphocyte stimulator (BLyS) antigen. The data were manually derived from the European patent (EP2275449B1) text. The dataset was cleaned and made suitable for the machine learning models. The accuracy, precision and recall achieved across individual descriptors (Membrane and Soluble) for Logistic regression, KNN, KSVM, and Random Forest Tree was above 80%. However, it was much lower for the Na{\"i}ve Bayes except for the precision score. The promising accuracy value achieved from such a minimal dataset has significant implications for the drug discovery process – this includes considerable savings in time and resources. ",
keywords = "Amino acid sequence, Antibody, Antigen, Infectious disease, Machine learning",
author = "Egaji, {Oche Alexander} and Seamus Ballard-Smith and Ikram Asghar and Mark Griffiths",
note = "Funding Information: The authors will like to acknowledge the European Regional Development Fund (ERDF) and the Welsh Government for funding this study. Our gratitude goes to all members of the Centre of Excellence in Mobile and Emerging Technologies (CEMET), the University of South Wales for their contribution in various capacity in this study. Publisher Copyright: {\textcopyright} 2020 ACM. Copyright: Copyright 2020 Elsevier B.V., All rights reserved.",
year = "2020",
month = jun,
day = "28",
doi = "10.1145/3418981.3418983",
language = "English",
isbn = "978-1-4503-8770-5",
series = "ACM International Conference Proceeding Series",
publisher = "Association for Computing Machinery",
pages = "20--24",
booktitle = "Proceedings of ICICM 2020 - 2020 10th International Conference on Information Communication and Management, Worshop",
}