% medRxiv preprint (Xiong et al., 2020), cleaned up from the site's automatic export.
% The abstract field holds only the paper's abstract. The submission-form
% declarations and the data-availability statement that the export had fused
% onto the end of the abstract are preserved in the non-standard fields
% declarations and data-availability; like elocation-id, these are field names
% that standard styles do not know and therefore do not print.
@article{Xiong2020.06.29.20141978,
  author            = {Xiong, Di and Zhang, Lu and Watson, Gregory L. and Sundin, Phillip and Bufford, Teresa and Zoller, Joseph A. and Shamshoian, John and Suchard, Marc A. and Ramirez, Christina M.},
  title             = {Pseudo-Likelihood Based Logistic Regression for Estimating {COVID-19} Infection and Case Fatality Rates by Gender, Race, and Age in {California}},
  journal           = {medRxiv},
  year              = {2020},
  publisher         = {Cold Spring Harbor Laboratory Press},
  elocation-id      = {2020.06.29.20141978},
  doi               = {10.1101/2020.06.29.20141978},
  url               = {https://www.medrxiv.org/content/early/2020/07/01/2020.06.29.20141978},
  eprint            = {https://www.medrxiv.org/content/early/2020/07/01/2020.06.29.20141978.full.pdf},
  abstract          = {In emerging epidemics, early estimates of key epidemiological characteristics of the disease are critical for guiding public policy. In particular, identifying high risk population subgroups aids policymakers and health officials in combatting the epidemic. This has been challenging during the coronavirus disease 2019 (COVID-19) pandemic, because governmental agencies typically release aggregate COVID-19 data as marginal summary statistics of patient demographics. These data may identify disparities in COVID-19 outcomes between broad population subgroups, but do not provide comparisons between more granular population subgroups defined by combinations of multiple demographics.
    We introduce a method that overcomes the limitations of aggregated summary statistics and yields estimates of COVID-19 infection and case fatality rates {\textemdash} key quantities for guiding public policy related to the control and prevention of COVID-19 {\textemdash} for population subgroups across combinations of demographic characteristics. Our approach uses pseudo-likelihood based logistic regression to combine aggregate COVID-19 case and fatality data with population-level demographic survey data to estimate infection and case fatality rates for population subgroups across combinations of demographic characteristics.
    We illustrate our method on California COVID-19 data to estimate test-based infection and case fatality rates for population subgroups defined by gender, age, and race and ethnicity. Our analysis indicates that in California, males have higher test-based infection rates and test-based case fatality rates across age and race/ethnicity groups, with the gender gap widening with increasing age. Although elderly infected with COVID-19 are at an elevated risk of mortality, the test-based infection rates do not increase monotonically with age. LatinX and African Americans have higher test-based infection rates than other race/ethnicity groups. The subgroups with the highest 5 test-based case fatality rates are African American male, Multi-race male, Asian male, African American female, and American Indian or Alaska Native male, indicating that African Americans are an especially vulnerable California subpopulation.},
  declarations      = {Competing Interest Statement: The authors have declared no competing interest.
    Funding Statement: The authors received no specific funding for this work.
    Author Declarations: I confirm all relevant ethical guidelines have been followed, and any necessary IRB and/or ethics committee approvals have been obtained. Yes.
    The details of the IRB/oversight body that provided approval or exemption for the research described are given below: No IRB body is required for this study.
    All necessary patient/participant consent has been obtained and the appropriate institutional forms have been archived. Yes.
    I understand that all clinical trials and any other prospective interventional studies must be registered with an ICMJE-approved registry, such as ClinicalTrials.gov. I confirm that any such study reported in the manuscript has been registered and the trial registration ID is provided (note: if posting a prospective study registered retrospectively, please provide a statement in the trial ID field explaining why the study was not registered in advance). Yes.
    I have followed all appropriate research reporting guidelines and uploaded the relevant EQUATOR Network research reporting checklist(s) and other pertinent material as supplementary files, if applicable. Yes.},
  data-availability = {The data underlying the results presented in the study are based on the most recent COVID-19 case and fatality data from the California Department of Public Health (CDPH) and population-level demographic data from the California Health Interview Survey (CHIS).
    https://www.cdph.ca.gov/Programs/CID/DCDC/Pages/COVID-19/Race-Ethnicity.aspx
    https://update.covid19.ca.gov/\#top
    https://www.cdph.ca.gov/Programs/CID/DCDC/Pages/COVID-19/COVID-19-Cases-by-Age-Group.aspx
    https://healthpolicy.ucla.edu/chis/data/Pages/GetCHISData.aspx},
}