@article {Luellen2020.07.27.20162867, author = {Eric Luellen}, title = {A machine learning explanation of the pathogen-immune relationship of SARS-CoV-2 and machine learning models of prognostic biomarkers to predict asymptomatic or symptomatic infections}, elocation-id = {2020.07.27.20162867}, year = {2020}, doi = {10.1101/2020.07.27.20162867}, publisher = {Cold Spring Harbor Laboratory Press}, abstract = {Asymptomatic people infected during the SARS-CoV-2 pandemic have outnumbered symptomatic people by an approximate ratio of 4:1 with little understanding to date as to why; therefore, they have been difficult to identify. Moreover, studies indicate that most asymptomatic virus-positive patients are infectious, thereby creating a new public health danger via a plethora of {\textquotedblleft}silent spreaders.{\textquotedblright} This data science study identified four novel discoveries that may significantly impact our understanding of the pathogen-immune relationship: (1) Spearman rho correlation coefficients and associated P-values identified 33 of 55 common immune factors have statistically significant associations with SARS-CoV-2 morbidity, their direction (+/-) and strength to inform research and therapies; (2) five machine learning algorithms were applied to 74 observations of these 33 immunological variables and identified three models of prognostic biomarkers that can classify and predict who will be asymptomatic or symptomatic if infected with 94.8\% to 100\% accuracy; (3) a random forest of 200 decision trees ordinally ranked the 33 statistically significant independent predictor variables by their relative importance in predicting SARS-CoV-2 symptoms; and, (4) three different decision-tree algorithms separately identified and validated three immunological biomarkers and levels that nearly always differentiate asymptomatic patients {\textendash} SCGF-β (\> 127637), IL-16 (\> 45), and M-CSF (\> 57). The implications of these findings are they indicate a tool that can identify in advance the 20\% of people who are at higher risk of morbidity from infection and suggests a specific stem-cell factor for therapeutics.Competing Interest StatementThe authors have declared no competing interest.Funding StatementNo external funding was received for this study.Author DeclarationsI confirm all relevant ethical guidelines have been followed, and any necessary IRB and/or ethics committee approvals have been obtained.YesThe details of the IRB/oversight body that provided approval or exemption for the research described are given below:Not applicable.All necessary patient/participant consent has been obtained and the appropriate institutional forms have been archived.YesI understand that all clinical trials and any other prospective interventional studies must be registered with an ICMJE-approved registry, such as ClinicalTrials.gov. I confirm that any such study reported in the manuscript has been registered and the trial registration ID is provided (note: if posting a prospective study registered retrospectively, please provide a statement in the trial ID field explaining why the study was not registered in advance).YesI have followed all appropriate research reporting guidelines and uploaded the relevant EQUATOR Network research reporting checklist(s) and other pertinent material as supplementary files, if applicable.YesThe data is in the public domain.}, URL = {https://www.medrxiv.org/content/early/2020/07/29/2020.07.27.20162867}, eprint = {https://www.medrxiv.org/content/early/2020/07/29/2020.07.27.20162867.full.pdf}, journal = {medRxiv} }