% medRxiv preprint entry. The abstract field holds only the structured abstract.
% The submission-form statements that the export had fused onto the abstract
% (competing interests, funding, ethics approval, data availability,
% abbreviations) are kept in the internal-note field, which standard
% bibliography styles do not print.
@article{Alanazi2020.06.10.20127225,
  author        = {Alanazi, Eisa and Alashaikh, Abdulaziz and Alqurashi, Sarah and Alanazi, Aued},
  title         = {Identifying and Ranking Common {COVID-19} Symptoms from {Arabic} {Twitter}},
  journal       = {medRxiv},
  publisher     = {Cold Spring Harbor Laboratory Press},
  year          = {2020},
  elocation-id  = {2020.06.10.20127225},
  doi           = {10.1101/2020.06.10.20127225},
  url           = {https://www.medrxiv.org/content/early/2020/06/12/2020.06.10.20127225},
  eprint        = {https://www.medrxiv.org/content/early/2020/06/12/2020.06.10.20127225.full.pdf},
  abstract      = {Background: Massive amount of covid-19 related data is generated everyday
                   by Twitter users. Self-reports of covid-19 symptoms on Twitter can reveal a
                   great deal about the disease and its prevalence in the community. In
                   particular, self-reports can be used as a valuable resource to learn more
                   about the common symptoms and whether their order of appearance differs
                   among different groups in the community. With sufficient available data,
                   this has the potential of developing a covid-19 risk-assessment system that
                   is tailored toward specific group of people.
                   Objective: The aim of this study is to identify the most common symptoms
                   reported by covid-19 patients in the Arabic language and order the symptoms
                   appearance based on the collected data.
                   Methods: We search the Arabic content of Twitter for personal reports of
                   covid-19 symptoms from March 1st to May 27th, 2020. We identify 463 Arabic
                   users who tweeted testing positive for covid-19 and extract the symptoms
                   they publicly associate with covid-19. Furthermore, we ask them directly
                   through personal messages to opt in and rank the appearance of the first
                   three symptoms they experienced right before (or after) diagnosed with
                   covid-19. Finally, we track their Twitter timeline to identify additional
                   symptoms that were mentioned within {\textpm}5 days from the day of tweeting
                   having covid-19. In summary, a list of 270 covid-19 reports were collected
                   and symptoms were (at least partially) ranked from early to late.
                   Results: The collected reports contained roughly 900 symptoms originated
                   from 74\% (n=201) male and 26\% (n=69) female Twitter users. The majority
                   (82\%) of the tracked users were living in Saudi Arabia (46\%) and Kuwait
                   (36\%). Furthermore, 13\% (n=36) of the collected reports were asymptomatic.
                   Out of the users with symptoms (n=234), 66\% (n=180) provided a
                   chronological order of appearance for at least three symptoms. Fever 59\%
                   (n=139), Headache 43\% (n=101), and Anosmia 39\% (n=91) were found to be the
                   top three symptoms mentioned by the reports. They count also for the top-3
                   common first symptoms in a way that 28\% (n=65) said their covid journey
                   started with a Fever, 15\% (n=34) with a Headache and 12\% (n=28) with
                   Anosmia. Out of the Saudi symptomatic reported cases (n=110), the most
                   common three symptoms were Fever 59\% (n=65), Anosmia 42\% (n=46), and
                   Headache 38\% (n=42).
                   Conclusions: This study demonstrates that Twitter is a valuable resource to
                   analyze and identify COVID-19 early symptoms within the Arabic content of
                   Twitter. It also suggests the possibility of developing a real-time
                   covid-19 risk estimator based on the users' tweets.},
  internal-note = {Statements exported by medRxiv together with the abstract.
                   Competing interest statement: The authors have declared no competing
                   interest.
                   Funding statement: This work was supported by King Abdulaziz City for
                   Science and Technology (Grant Number: 5-20-01-007-0033).
                   Author declarations (ethical guidelines and approvals, participant consent,
                   trial registration, reporting guidelines): all answered Yes.
                   IRB/oversight body: CIADA Ethical Committee, Umm Al-Qura University, Saudi
                   Arabia.
                   Data availability: Data is continuously updated and available upon request.
                   Abbreviations: API, application programming interface; COVID-19,
                   coronavirus disease.},
}