% Poirier et al. (2019), medRxiv record 10.1101/19009795.
% The abstract field carries, in addition to the abstract proper, the author
% summary and the competing-interest, funding, and author-declaration
% statements that were exported together with the record.
% Words in the title that must keep their capitalisation are brace-protected.
@article{Poirier19009795,
  author        = {Poirier, Canelle and Hswen, Yulin and Bouzill{\'e}, Guillaume and Cuggia, Marc and Lavenu, Audrey and Brownstein, John S and Brewer, Thomas and Santillana, Mauricio},
  title         = {Influenza forecasting for the {French} regions by using {EHR}, web and climatic data sources with an ensemble approach {ARGONet}},
  journal       = {medRxiv},
  publisher     = {Cold Spring Harbor Laboratory Press},
  year          = {2019},
  elocation-id  = {19009795},
  doi           = {10.1101/19009795},
  url           = {https://www.medrxiv.org/content/early/2019/11/25/19009795},
  eprint        = {https://www.medrxiv.org/content/early/2019/11/25/19009795.full.pdf},
  abstract      = {Effective and timely disease surveillance systems have the potential to help public health officials design interventions to mitigate the effects of disease outbreaks. Currently, healthcare-based disease monitoring systems in France offer influenza activity information that lags real-time by 1 to 3 weeks. This temporal data gap introduces uncertainty that prevents public health officials from having a timely perspective on the population-level disease activity. Here, we present a machine-learning modeling approach that produces real-time estimates and short-term forecasts of influenza activity for the 12 continental regions of France by leveraging multiple disparate data sources that include, Google search activity, real-time and local weather information, flu-related Twitter micro-blogs, electronic health records data, and historical disease activity synchronicities across regions. Our results show that all data sources contribute to improving influenza surveillance and that machine-learning ensembles that combine all data sources lead to accurate and timely predictions.
    Author summary: The role of public health is to protect the health of populations by providing the right intervention to the right population at the right time. In France and all around the world, Influenza is a major public health problem. Traditional surveillance systems produce estimates of influenza-like illness (ILI) incidence rates, but with one-to three-week delay. Accurate real-time monitoring systems of influenza outbreaks could be useful for public health decisions. By combining different data sources and different statistical models, we propose an accurate and timely forecasting platform to track the flu in France at a spatial resolution that, to our knowledge, has not been explored before.
    Competing Interest Statement: The authors have declared no competing interest.
    Funding Statement: CP, MC, GB and AL were partially funded by the French National Research Agency inside the Integrating and Sharing Health Data for Research Project (Grant No.452ANR-15-CE19-0024). MS and CP were partially funded by the National Institute of General Medical Sciences of the National Institutes of Health under Award Number R01GM130668. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.
    Author Declarations: All relevant ethical guidelines have been followed and any necessary IRB and/or ethics committee approvals have been obtained. Not Applicable. All necessary patient/participant consent has been obtained and the appropriate institutional forms have been archived. Not Applicable. Any clinical trials involved have been registered with an ICMJE-approved registry such as ClinicalTrials.gov and the trial ID is included in the manuscript. Not Applicable. I have followed all appropriate research reporting guidelines and uploaded the relevant Equator, ICMJE or other checklist(s) as supplementary files, if applicable. Yes. All data cannot be shared publicly, in particular EHR data, due to the protection of patient data.},
}