{"markup":"\u003C?xml version=\u00221.0\u0022 encoding=\u0022UTF-8\u0022 ?\u003E\n    \u003Chtml version=\u0022HTML+RDFa+MathML 1.1\u0022\n    xmlns:content=\u0022http:\/\/purl.org\/rss\/1.0\/modules\/content\/\u0022\n    xmlns:dc=\u0022http:\/\/purl.org\/dc\/terms\/\u0022\n    xmlns:foaf=\u0022http:\/\/xmlns.com\/foaf\/0.1\/\u0022\n    xmlns:og=\u0022http:\/\/ogp.me\/ns#\u0022\n    xmlns:rdfs=\u0022http:\/\/www.w3.org\/2000\/01\/rdf-schema#\u0022\n    xmlns:sioc=\u0022http:\/\/rdfs.org\/sioc\/ns#\u0022\n    xmlns:sioct=\u0022http:\/\/rdfs.org\/sioc\/types#\u0022\n    xmlns:skos=\u0022http:\/\/www.w3.org\/2004\/02\/skos\/core#\u0022\n    xmlns:xsd=\u0022http:\/\/www.w3.org\/2001\/XMLSchema#\u0022\n    xmlns:mml=\u0022http:\/\/www.w3.org\/1998\/Math\/MathML\u0022\u003E\n  \u003Chead\u003E\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022\/\/cdn.jsdelivr.net\/qtip2\/2.2.1\/jquery.qtip.min.js\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/js\/js_YjAJQgxDlFX6S-O02jj9jCrVbrwlY3CGgCg1FzPlvBs.js\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022\u003E\n\u003C!--\/\/--\u003E\u003C![CDATA[\/\/\u003E\u003C!--\nif(typeof window.MathJax === \u0022undefined\u0022) window.MathJax = { menuSettings: { zoom: \u0022Click\u0022 } };\n\/\/--\u003E\u003C!]]\u003E\n\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/js\/js_waP91NpgGpectm_6Y2XDEauLJ8WCSCBKmmA87unpp2E.js\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.googletagmanager.com\/gtag\/js?id=G-0K57TCX5BY\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022\u003E\n\u003C!--\/\/--\u003E\u003C![CDATA[\/\/\u003E\u003C!--\nwindow.dataLayer = window.dataLayer || [];function gtag(){dataLayer.push(arguments)};gtag(\u0022js\u0022, new 
Date());gtag(\u0022set\u0022, \u0022developer_id.dMDhkMT\u0022, true);gtag(\u0022config\u0022, \u0022G-0K57TCX5BY\u0022, {\u0022groups\u0022:\u0022default\u0022,\u0022anonymize_ip\u0022:true});\n\/\/--\u003E\u003C!]]\u003E\n\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022\u003E\n\u003C!--\/\/--\u003E\u003C![CDATA[\/\/\u003E\u003C!--\njQuery.extend(Drupal.settings, {\u0022basePath\u0022:\u0022\\\/\u0022,\u0022pathPrefix\u0022:\u0022\u0022,\u0022highwire\u0022:{\u0022ac\u0022:{\u0022medrxiv;2025.07.01.25330655v2\u0022:{\u0022access\u0022:{\u0022full\u0022:true},\u0022pisa_id\u0022:\u0022medrxiv;2025.07.01.25330655v2\u0022,\u0022apath\u0022:\u0022\u0022,\u0022jcode\u0022:\u0022medrxiv\u0022}},\u0022processed\u0022:[\u0022highwire_math\u0022],\u0022markup\u0022:[{\u0022requested\u0022:\u0022full-text\u0022,\u0022variant\u0022:\u0022full-text\u0022,\u0022view\u0022:\u0022full\u0022,\u0022pisa\u0022:\u0022medrxiv;2025.07.01.25330655v2\u0022}]},\u0022instances\u0022:\u0022{\\u0022highwire_abstract_tooltip\\u0022:{\\u0022content\\u0022:{\\u0022text\\u0022:\\u0022\\u0022},\\u0022style\\u0022:{\\u0022tip\\u0022:{\\u0022width\\u0022:20,\\u0022height\\u0022:20,\\u0022border\\u0022:1,\\u0022offset\\u0022:0,\\u0022corner\\u0022:true},\\u0022classes\\u0022:\\u0022qtip-custom hw-tooltip hw-abstract-tooltip qtip-shadow qtip-rounded\\u0022,\\u0022classes_custom\\u0022:\\u0022hw-tooltip hw-abstract-tooltip\\u0022},\\u0022position\\u0022:{\\u0022at\\u0022:\\u0022right center\\u0022,\\u0022my\\u0022:\\u0022left center\\u0022,\\u0022viewport\\u0022:true,\\u0022adjust\\u0022:{\\u0022method\\u0022:\\u0022shift\\u0022}},\\u0022show\\u0022:{\\u0022event\\u0022:\\u0022mouseenter click \\u0022,\\u0022solo\\u0022:true},\\u0022hide\\u0022:{\\u0022event\\u0022:\\u0022mouseleave 
\\u0022,\\u0022fixed\\u0022:1,\\u0022delay\\u0022:\\u0022100\\u0022}},\\u0022highwire_author_tooltip\\u0022:{\\u0022content\\u0022:{\\u0022text\\u0022:\\u0022\\u0022},\\u0022style\\u0022:{\\u0022tip\\u0022:{\\u0022width\\u0022:15,\\u0022height\\u0022:15,\\u0022border\\u0022:1,\\u0022offset\\u0022:0,\\u0022corner\\u0022:true},\\u0022classes\\u0022:\\u0022qtip-custom hw-tooltip hw-author-tooltip qtip-shadow qtip-rounded\\u0022,\\u0022classes_custom\\u0022:\\u0022hw-tooltip hw-author-tooltip\\u0022},\\u0022position\\u0022:{\\u0022at\\u0022:\\u0022top center\\u0022,\\u0022my\\u0022:\\u0022bottom center\\u0022,\\u0022viewport\\u0022:true,\\u0022adjust\\u0022:{\\u0022method\\u0022:\\u0022\\u0022}},\\u0022show\\u0022:{\\u0022event\\u0022:\\u0022mouseenter \\u0022,\\u0022solo\\u0022:true},\\u0022hide\\u0022:{\\u0022event\\u0022:\\u0022mouseleave \\u0022,\\u0022fixed\\u0022:1,\\u0022delay\\u0022:\\u0022100\\u0022}},\\u0022highwire_reflinks_tooltip\\u0022:{\\u0022content\\u0022:{\\u0022text\\u0022:\\u0022\\u0022},\\u0022style\\u0022:{\\u0022tip\\u0022:{\\u0022width\\u0022:15,\\u0022height\\u0022:15,\\u0022border\\u0022:1,\\u0022mimic\\u0022:\\u0022top center\\u0022,\\u0022offset\\u0022:0,\\u0022corner\\u0022:true},\\u0022classes\\u0022:\\u0022qtip-custom hw-tooltip hw-ref-link-tooltip qtip-shadow qtip-rounded\\u0022,\\u0022classes_custom\\u0022:\\u0022hw-tooltip hw-ref-link-tooltip\\u0022},\\u0022position\\u0022:{\\u0022at\\u0022:\\u0022bottom left\\u0022,\\u0022my\\u0022:\\u0022top left\\u0022,\\u0022viewport\\u0022:true,\\u0022adjust\\u0022:{\\u0022method\\u0022:\\u0022flip\\u0022}},\\u0022show\\u0022:{\\u0022event\\u0022:\\u0022mouseenter \\u0022,\\u0022solo\\u0022:true},\\u0022hide\\u0022:{\\u0022event\\u0022:\\u0022mouseleave 
\\u0022,\\u0022fixed\\u0022:1,\\u0022delay\\u0022:\\u0022100\\u0022}}}\u0022,\u0022qtipDebug\u0022:\u0022{\\u0022leaveElement\\u0022:0}\u0022,\u0022googleanalytics\u0022:{\u0022account\u0022:[\u0022G-0K57TCX5BY\u0022],\u0022trackOutbound\u0022:1,\u0022trackMailto\u0022:1,\u0022trackDownload\u0022:1,\u0022trackDownloadExtensions\u0022:\u00227z|aac|arc|arj|asf|asx|avi|bin|csv|doc(x|m)?|dot(x|m)?|exe|flv|gif|gz|gzip|hqx|jar|jpe?g|js|mp(2|3|4|e?g)|mov(ie)?|msi|msp|pdf|phps|png|ppt(x|m)?|pot(x|m)?|pps(x|m)?|ppam|sld(x|m)?|thmx|qtm?|ra(m|r)?|sea|sit|tar|tgz|torrent|txt|wav|wma|wmv|wpd|xls(x|m|b)?|xlt(x|m)|xlam|xml|z|zip\u0022,\u0022trackColorbox\u0022:1},\u0022ajaxPageState\u0022:{\u0022js\u0022:{\u0022\\\/\\\/cdn.jsdelivr.net\\\/qtip2\\\/2.2.1\\\/jquery.qtip.min.js\u0022:1,\u0022sites\\\/all\\\/modules\\\/highwire\\\/highwire\\\/plugins\\\/highwire_markup_process\\\/js\\\/highwire_article_reference_popup.js\u0022:1,\u0022sites\\\/all\\\/modules\\\/highwire\\\/highwire\\\/plugins\\\/highwire_markup_process\\\/js\\\/highwire_at_symbol.js\u0022:1,\u00220\u0022:1,\u0022sites\\\/all\\\/modules\\\/contrib\\\/google_analytics\\\/googleanalytics.js\u0022:1,\u0022https:\\\/\\\/www.googletagmanager.com\\\/gtag\\\/js?id=G-0K57TCX5BY\u0022:1,\u00221\u0022:1}}});\n\/\/--\u003E\u003C!]]\u003E\n\u003C\/script\u003E\n\u003Clink type=\u0022text\/css\u0022 rel=\u0022stylesheet\u0022 href=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/advagg_css\/css__dn-cpI1YtkU_iLHgA5WhlkxgYWyat_IxjF_B-WSYrpE__a9hIbt0eaZ7d5nhwnm2weG8R_2eXK4EvoOx9dOxouHE__QrrGUc7CpljPR5Aph-ukPbcwtK4AWrHGwCEXJ_k1V_c.css\u0022 media=\u0022all\u0022 \/\u003E\n\u003Clink type=\u0022text\/css\u0022 rel=\u0022stylesheet\u0022 href=\u0022\/\/cdn.jsdelivr.net\/qtip2\/2.2.1\/jquery.qtip.min.css\u0022 media=\u0022all\u0022 \/\u003E\n\u003Clink type=\u0022text\/css\u0022 rel=\u0022stylesheet\u0022 
href=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/advagg_css\/css__HGACIFBlu2o05y3afvqlt5wrE_5Dn6MXsexfuEpeIwg__t4SOPxucAPoV3Os7g8dXqyMB1HRXQridRJ82X7nE33E__QrrGUc7CpljPR5Aph-ukPbcwtK4AWrHGwCEXJ_k1V_c.css\u0022 media=\u0022all\u0022 \/\u003E\n\u003Clink rel=\u0027stylesheet\u0027 type=\u0027text\/css\u0027 href=\u0027\/sites\/all\/modules\/contrib\/panels\/plugins\/layouts\/onecol\/onecol.css\u0027 \/\u003E\u003C\/head\u003E\u003Cbody\u003E\u003Cdiv class=\u0022panels-ajax-tab-panel panels-ajax-tab-panel-article-tab-full-text\u0022\u003E\u003Cdiv class=\u0022panel-display panel-1col clearfix\u0022 \u003E\n  \u003Cdiv class=\u0022panel-panel panel-col\u0022\u003E\n    \u003Cdiv\u003E\u003Cdiv class=\u0022panel-pane pane-highwire-markup\u0022 \u003E\n  \n      \n  \n  \u003Cdiv class=\u0022pane-content\u0022\u003E\n    \u003Cdiv class=\u0022highwire-markup\u0022\u003E\u003Cdiv xmlns=\u0022http:\/\/www.w3.org\/1999\/xhtml\u0022 data-highwire-cite-ref-tooltip-instance=\u0022highwire_reflinks_tooltip\u0022 class=\u0022content-block-markup\u0022 xmlns:xhtml=\u0022http:\/\/www.w3.org\/1999\/xhtml\u0022\u003E\u003Cdiv class=\u0022article fulltext-view \u0022\u003E\u003Cspan class=\u0022highwire-journal-article-marker-start\u0022\u003E\u003C\/span\u003E\u003Cdiv class=\u0022section abstract\u0022 id=\u0022abstract-1\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EAbstract\u003C\/h2\u003E\u003Cp id=\u0022p-2\u0022\u003EThe growing use of large language models (LLMs) for biomedical question answering raises concerns about the accuracy and evidentiary support of their responses. To address this, we present \u003Cem\u003EAnswered with Evidence\u003C\/em\u003E, a framework for evaluating whether LLM generated answers are grounded in scientific literature. We analyzed thousands of physician-submitted questions using a comparative pipeline across seven LLMs grounded in different evidence sources. 
Six sources were grounded in PubMed or general online content, and the last source was grounded in the Atropos Alexandria library of custom real-world analyses. We found that the general purpose LLMs grounded in public information varied greatly in the answers they returned, even when those answers were sourced from the same publication. Using an ensemble approach, we observed that 49% of the time, two or more LLMs agreed on an answer. Combined, the ensemble approach and the Alexandria custom built source enabled reliable answers to over 64% of biomedical queries. As LLMs become increasingly capable of summarizing scientific content, maximizing their value will require systems that can accurately retrieve both published and custom-generated evidence or generate reliable evidence in real time.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-1\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EBackground\u003C\/h2\u003E\u003Cp id=\u0022p-14\u0022\u003EEvidence-based medicine\u2014making clinical decisions based on the best available research\u2014has been the standard of care for over three decades\u003Csup\u003E\u003Ca id=\u0022xref-ref-1-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-1\u0022\u003E1\u003C\/a\u003E\u003C\/sup\u003E. However, in some specialties, fewer than 20% of daily medical decisions are supported by high-quality evidence\u003Csup\u003E\u003Ca id=\u0022xref-ref-2-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-2\u0022\u003E2\u003C\/a\u003E\u003C\/sup\u003E. This gap arises primarily from two challenges: First, clinical trials often lack generalizability to real-world patients, especially those with complex comorbidities who are frequently excluded from study populations\u003Csup\u003E\u003Ca id=\u0022xref-ref-3-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-3\u0022\u003E3\u003C\/a\u003E\u003C\/sup\u003E. 
Second, even when multiple relevant studies exist, their findings may conflict due to heterogeneity in patient populations, variable study quality, and inconsistent endpoints and difficulty for the care provider to access the evidence\u003Csup\u003E\u003Ca id=\u0022xref-ref-4-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-4\u0022\u003E4\u003C\/a\u003E\u003C\/sup\u003E. These limitations hinder the synthesis of clear, actionable recommendations for individual patients, leading clinicians to rely heavily on summarized evidence from trusted sources\u003Csup\u003E\u003Ca id=\u0022xref-ref-5-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-5\u0022\u003E5\u003C\/a\u003E\u003C\/sup\u003E.\u003C\/p\u003E\u003Cp id=\u0022p-15\u0022\u003ELarge language models (LLMs) are increasingly being explored for biomedical applications, including literature summarization and natural language question answering\u003Csup\u003E\u003Ca id=\u0022xref-ref-6-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-6\u0022\u003E6\u003C\/a\u003E\u2013\u003Ca id=\u0022xref-ref-8-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-8\u0022\u003E8\u003C\/a\u003E\u003C\/sup\u003E. LLMs have demonstrated impressive capabilities in extracting and synthesizing biomedical information, but they are also prone to hallucinating sources, fabricating citations, or generating responses that deviate from established clinical guidelines\u003Csup\u003E\u003Ca id=\u0022xref-ref-9-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-9\u0022\u003E9\u003C\/a\u003E\u2013\u003Ca id=\u0022xref-ref-11-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-11\u0022\u003E11\u003C\/a\u003E\u003C\/sup\u003E. Furthermore, slight changes in question structure can reduce the accuracy of LLMs on commonly measured clinical tasks\u003Csup\u003E\u003Ca id=\u0022xref-ref-12-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-12\u0022\u003E12\u003C\/a\u003E\u003C\/sup\u003E. 
These shortcomings present risks in domains where accuracy and reliability are critical. Despite these concerns, LLM integration into biomedical research and clinical workflows has accelerated markedly in recent years. If accuracy and error rates are not carefully measured now, it is possible that future high-profile mistakes will shake trust in the medical application of this promising technology.\u003C\/p\u003E\u003Cp id=\u0022p-16\u0022\u003EOne emerging use case is the use of LLMs to generate evidence summaries to support clinical decision-making. Several commercial services\u2014such as Open Evidence, System, Consensus, SciSummary, Perplexity, and others\u2014now offer LLM-powered interfaces to biomedical literature \u003Csup\u003E\u003Ca id=\u0022xref-ref-13-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-13\u0022\u003E13\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-14-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-14\u0022\u003E14\u003C\/a\u003E\u003C\/sup\u003E. While adoption of these tools is increasing, questions remain about how to evaluate their reliability and trustworthiness. Frameworks like the recently proposed MedHELM \u003Csup\u003E\u003Ca id=\u0022xref-ref-15-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-15\u0022\u003E15\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-16-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-16\u0022\u003E16\u003C\/a\u003E\u003C\/sup\u003E aim to standardize the evaluation of LLM outputs across tasks, but they do not yet assess whether responses are grounded in verifiable biomedical evidence.\u003C\/p\u003E\u003Cp id=\u0022p-17\u0022\u003EIn this study, we introduce \u003Cem\u003EAnswered with Evidence\u003C\/em\u003E, a structured methodology for evaluating the evidentiary grounding and citation fidelity of LLM-generated answers to biomedical questions. 
Our approach emphasizes verifiability against trusted biomedical sources, enabling the development and monitoring of systems suitable for clinical decision support and real-world evidence generation. To assess the utility of this framework, we analyzed nearly three thousand physician-submitted questions to Atropos Health\u2019s Green Button Service \u003Csup\u003E\u003Ca id=\u0022xref-ref-8-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-8\u0022\u003E8\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-17-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-17\u0022\u003E17\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-18-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-18\u0022\u003E18\u003C\/a\u003E\u003C\/sup\u003E\u2014 a human-in-the-loop, real-world evidence platform used by clinicians, hospital leaders, and researchers. Answers were compared across 7 LLMs: Three PubMed-based retrieval-augmented systems (System, Perplexity, and Claude), Open AI (o3 and GPT-5) grounded in web search preview, Gemini grounded in Google search, and Alexandria, the Atropos Evidence Library, a curated collection of real-world evidence derived from prior medical inquiries.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-2\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EMaterials and Methods\u003C\/h2\u003E\u003Cp id=\u0022p-18\u0022\u003E\u003Ca id=\u0022xref-fig-1-1\u0022 class=\u0022xref-fig\u0022 href=\u0022#F1\u0022\u003EFigure 1\u003C\/a\u003E outlines the overall analysis workflow. We began by selecting a sample of 2,942 questions submitted to Atropos Health between 2022 and 2025. These questions originated from physicians seeking evidence to inform clinical decisions and from researchers evaluating treatment efficacy or event rates in defined populations. 
The sample spans all major clinical subspecialties and includes a diverse range of query types\u2014from causal inference questions related to adverse events and treatment comparisons to more straightforward questions about prevalence and incidence.\u003C\/p\u003E\u003Cdiv id=\u0022F1\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F1.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022\u0026#x2013; Evidence Badge Generation Workflow \u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-518782870\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;\u0026#x2013; Evidence Badge Generation Workflow\u0026lt;\/span\u0026gt; \u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure 1\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F1.medium.gif\u0022 width=\u0022440\u0022 height=\u0022138\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure 1\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F1.medium.gif\u0022 width=\u0022440\u0022 
height=\u0022138\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F1.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure 1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F1.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022 xmlns:xhtml=\u0022http:\/\/www.w3.org\/1999\/xhtml\u0022\u003E\u003Cspan class=\u0022fig-label\u0022\u003EFigure 1\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Evidence Badge Generation Workflow\u003C\/span\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-19\u0022\u003EEach question was processed on an LLM with access to the different underlying evidence sources mentioned above. 
Once the response was obtained, it was evaluated for whether it was based in evidence, and then, based on that evaluation, a \u201cbadge\u201d was assigned to ease user interpretation.\u003C\/p\u003E\u003Cdiv id=\u0022sec-3\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EEvidence Sources\u003C\/h3\u003E\u003Cp id=\u0022p-20\u0022\u003EWe evaluated biomedical question-answering systems using seven distinct evidence sources, each optimized for different types of clinical inquiries. The first three sources\u2014System Inc\u003Csup\u003E\u003Ca id=\u0022xref-ref-14-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-14\u0022\u003E14\u003C\/a\u003E\u003C\/sup\u003E, Claude (Opus 4)\u003Csup\u003E\u003Ca id=\u0022xref-ref-19-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-19\u0022\u003E19\u003C\/a\u003E\u003C\/sup\u003E, and Perplexity (Sonar-deep-research) \u003Csup\u003E\u003Ca id=\u0022xref-ref-13-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-13\u0022\u003E13\u003C\/a\u003E\u003C\/sup\u003E\u2014are retrieval-augmented generation\u003Csup\u003E\u003Ca id=\u0022xref-ref-20-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-20\u0022\u003E20\u003C\/a\u003E\u003C\/sup\u003E (RAG) platforms grounded in the PubMed corpus, comprising peer-reviewed biomedical literature that reflects the current state of scientific knowledge. Perplexity and Claude, while designed as general-purpose LLM-based question-answering tools, were configured for this analysis to retrieve only from academic publications. SystemAI combines large language models with graph-based retrieval technologies, trained specifically on scientific literature using state-of-the-art models.\u003C\/p\u003E\u003Cp id=\u0022p-21\u0022\u003EThree other LLMs\u2014OpenAI (o3 and GPT-5) and Gemini (2.5 Flash)\u2014are general-purpose LLMs trained on a large corpus of available information via web search tools (Google Search, specifically, in the case of Gemini). 
Despite their general purpose nature, they have gained traction for healthcare uses and previous iterations of each model have been scored on medical tasks via the MedHELM framework (performance available at: \u003Ca href=\u0022https:\/\/crfm.stanford.edu\/helm\/medhelm\/latest\/\u0022\u003Ehttps:\/\/crfm.stanford.edu\/helm\/medhelm\/latest\/\u003C\/a\u003E).\u003C\/p\u003E\u003Cp id=\u0022p-22\u0022\u003EThe final evidence source is Alexandria, the Atropos Evidence Library, a proprietary collection of structured real-world evidence (RWE). This library includes studies generated from electronic health records, open and closed claims data, and specialized clinical datasets in response to specific physician and researcher inquiries. Each study includes a physician-written summary and clear description of the study methods, describing the study population, arm assignment, baseline characteristics, and outcomes of interest.\u003C\/p\u003E\u003Cp id=\u0022p-23\u0022\u003ECollectively, these 7 models provide a comprehensive basis for evaluating the correctness, evidence alignment, and clinical relevance of LLM-generated answers. For six of the sources, all of the nearly 3,000 questions were evaluated. A subset of 1,739 questions was randomly selected for evaluation using the Perplexity platform. This subset was chosen to balance computational cost and runtime constraints while maintaining sufficient diversity to represent the broader range of biomedical queries.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-4\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EEvidence Evaluation\u003C\/h3\u003E\u003Cp id=\u0022p-24\u0022\u003EWe apply a structured evaluation rubric composed of three binary (True\/False) criteria. 
Each criterion isolates a specific dimension of answer quality with respect to its contextual support.\u003C\/p\u003E\u003Cdiv id=\u0022T1\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1058819\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1058819\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022download-ppt last\u0022\u003E\u003Ca href=\u0022\/highwire\/powerpoint\/1058819\u0022 class=\u0022highwire-figure-link highwire-figure-link-ppt\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload powerpoint\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-25\u0022\u003EOnce the appropriate context is retrieved and an AI-generated answer returned, we use a structured prompt to judge the answers\u2019 relevance and grounding. 
This evaluation assesses how well the AI-generated answer responds to the original question, given only the retrieved context (Full prompt details available in Supplemental Figure S1).\u003C\/p\u003E\u003Cp id=\u0022p-26\u0022\u003ETo simplify interpretation, each evaluated question-answer pair is assigned a color-coded Answered with Evidence badge based on the boolean fields from the structured prompt output. An example of the evaluation of a question-response context and badge assignment is shown in \u003Ca id=\u0022xref-fig-2-1\u0022 class=\u0022xref-fig\u0022 href=\u0022#F2\u0022\u003EFigure 2\u003C\/a\u003E.\u003C\/p\u003E\u003Cdiv id=\u0022F2\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F2.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022\u0026#x2013; Example Context Evaluation and Badge Assignment \u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-518782870\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;\u0026#x2013; Example Context Evaluation and Badge Assignment\u0026lt;\/span\u0026gt; \u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure 2\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 
data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F2.medium.gif\u0022 width=\u0022440\u0022 height=\u0022258\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure 2\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F2.medium.gif\u0022 width=\u0022440\u0022 height=\u0022258\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F2.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure 2\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F2.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022\u003E\u003Cspan class=\u0022fig-label\u0022\u003EFigure 2\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Example Context Evaluation and Badge Assignment\u003C\/span\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv id=\u0022T2\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul 
class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1058824\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup last\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1058824\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-27\u0022\u003EThis logic provides a quick way to assess the quality and reliability of evidence grounding in biomedical question-answer responses. The badge system is designed to classify the factual alignment of AI-generated answers and signal the evidence landscape surrounding a biomedical question. The green badge indicates a high-confidence response. These answers represent areas of well-established evidence where the AI-generated answer is effectively synthesizing known information. The yellow badge indicates the context is relevant to the question, and the answer is grounded in it, but the context does not directly answer the question. It reflects situations where indirect evidence or background knowledge exists, but no study has yet addressed the specific question. This marks the evidence gap and the opportunity to generate a novel study. 
The red badge indicates the context is not related, the answer introduces hallucinated content, or both. It represents a low-confidence response.\u003C\/p\u003E\u003Cp id=\u0022p-28\u0022\u003EIn addition to the badging, each LLM was instructed to provide a reference to the document\/publication from which the answer was pulled, as well as what text within the reference material is the basis for the answer. These references were manually verified to be non-hallucinated, and the snippet of interest was manually verified to exist within the document itself.\u003C\/p\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-5\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EResults\u003C\/h2\u003E\u003Cdiv id=\u0022sec-6\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EEvidence Criterion Assessment and Answered with Evidence Badge assignment across evidence sources\u003C\/h3\u003E\u003Cp id=\u0022p-29\u0022\u003EAll questions were submitted to the seven evaluated evidence sources, and each response was assessed based on the criteria described in the Evidence Evaluation section. A summary of the badge assignment for the three evidence sources can be found in \u003Ca id=\u0022xref-table-wrap-3-1\u0022 class=\u0022xref-table\u0022 href=\u0022#T3\u0022\u003ETable 1\u003C\/a\u003E. For the PubMed-based sources, the System platform produced high-confidence, evidence-grounded responses (green badge) for 44.6% of queries. Perplexity, when restricted to academic literature, achieved green-badged responses for 21.3% of cases, and Claude, with a similar restriction, had a green badge 29.1% of the time. For the general-purpose LLMs, a green badge was assigned in Gemini 45.2% of the time, OpenAI o3 71% of the time, and GPT-5 67.1% of the time. 
The higher rate of green badge assignment in the general-purpose LLMs was a surprising result that caused us to evaluate the reference document and reference snippet that supported the finding (see Intersource Agreement for Evidence Badge Assignment). The remaining responses from these sources were assigned Yellow or Red badges, indicating that either the answer lacked sufficient evidence grounding (Yellow) or was irrelevant to the original question (Red). For full details, see table S1.\u003C\/p\u003E\u003Cdiv id=\u0022T3\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1058818\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup last\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1058818\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022table-caption\u0022\u003E\u003Cspan class=\u0022table-label\u0022\u003ETable 1\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Answered with evidence 
badge summary across evidence sources.\u003C\/span\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-30\u0022\u003EIn comparison, Alexandria, the Atropos Evidence Library, which generates responses using structured real-world evidence from EHR, claims, and other clinical datasets, produced Green-badged responses for 50.1% of the submitted questions. The remaining 49.9% were rated Yellow or Red, typically due to limitations in available real-world data or ambiguity in the question framing.\u003C\/p\u003E\u003Cp id=\u0022p-31\u0022\u003EThese findings suggest that novel real-world evidence sources may provide comparable or improved grounding relative to PubMed-based and general web search retrieval systems, particularly for complex or underrepresented clinical scenarios.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-7\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EIntersource agreement for Evidence Badge assignment\u003C\/h3\u003E\u003Cp id=\u0022p-32\u0022\u003ETo assess the consistency of evidence grounding, we compared badge assignments, references provided by LLM, and snippet of supporting evidence from the different evidence sources. Our hypothesis was that the PubMed-based sources (System, Claude, and Perplexity) would show a high concordance of badge assignments, that the web-search based models (Open AI and Gemini) would have the highest percentage of green-badges, albeit with some citations originating from non-reliable sources, and the custom real-world evidence source (Alexandria) would have the most novel answers that could not be answered by the other sources. 
Within each group, we anticipated only partial agreement due to differences in retrieval mechanisms and response generation strategies.\u003C\/p\u003E\u003Cp id=\u0022p-33\u0022\u003EIn comparing responses that obtained a Green badge (found to be answered with evidence) the highest agreement between sources was between Atropos and OpenAI (\u003Ca id=\u0022xref-table-wrap-4-1\u0022 class=\u0022xref-table\u0022 href=\u0022#T4\u0022\u003ETable 2\u003C\/a\u003E; 37.39%). The lowest agreement in Green badge assignment was between Perplexity and Claude (5.5%). In both cases, the agreement is driven by the percent of questions that received the green badge for each source; Atropos and Open AI have the most green badges, and Perplexity and Claude have the fewest. For a full breakdown of pairwise\/global intersource badge agreement on Yellow and Red badges, please see table S2 and S3. When considering all sources, 88% of all submitted questions were able to return a response that received a green badge.\u003C\/p\u003E\u003Cdiv id=\u0022T4\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1058825\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup\u0022\u003E\u003Ca 
href=\u0022\/highwire\/markup\/1058825\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022download-ppt last\u0022\u003E\u003Ca href=\u0022\/highwire\/powerpoint\/1058825\u0022 class=\u0022highwire-figure-link highwire-figure-link-ppt\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload powerpoint\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022table-caption\u0022\u003E\u003Cspan class=\u0022table-label\u0022\u003ETable 2\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Pairwise agreement between different evidence sources\u003C\/span\u003E\u003Cp id=\u0022p-34\u0022 class=\u0022first-child\u0022\u003EEvery question was submitted to each LLM and the output was evaluated with the Answered with evidence framework. For each evidence source a pairwise agreement was calculated for Green Badges (Shown) and Red\/Yellow (extended table S1). The highest agreement that a question could be answered with evidence was between Atropos\/OpenAI.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-35\u0022\u003EThe high variability between green badges in different evidence sources trained on theoretically similar sources was surprising to us. To understand why this was the case, we explored the citation returned by the LLM describing where the evidence was sourced as well as the snippet identified as containing the evidence. 
This cross-model deep evaluation was performed on 100 questions, limited to Claude, Perplexity, Open AI, and Gemini all of which make retrieval of the source URL possible (\u003Ca id=\u0022xref-table-wrap-5-1\u0022 class=\u0022xref-table\u0022 href=\u0022#T5\u0022\u003ETable 3\u003C\/a\u003E). We identified the highest similarity of source was between Claude\/Perplexity at 53%. Given that both can be limited to only utilize Pubmed, the fact they had the highest agreement is to be expected but only 53% agreement was surprising. On the other side we found no agreement across the sample between OpenAI and Gemini in the referenced document. When two or more sources referenced the same document, we evaluated similarity between snippets and found different statements from the same article serving as reference.\u003C\/p\u003E\u003Cdiv id=\u0022T5\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1058821\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1058821\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 
data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022download-ppt last\u0022\u003E\u003Ca href=\u0022\/highwire\/powerpoint\/1058821\u0022 class=\u0022highwire-figure-link highwire-figure-link-ppt\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload powerpoint\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022table-caption\u0022\u003E\u003Cspan class=\u0022table-label\u0022\u003ETable 3\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Cited Source agreement across evidence sources\u003C\/span\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-36\u0022\u003EGiven the high variability in the referenced documentation and the snippets used for supporting the LLM response, we evaluated how often one or more LLMs had a green badge. For the non-custom-RWE evidence sources, at least one gave a Green badge 81% of the time but this dropped to 49% when we required two or more LLMs to have a green badge, and 25% when requiring 3 or more LLMs to achieve consensus of an answer being grounded in evidence.\u003C\/p\u003E\u003Cp id=\u0022p-37\u0022\u003EAdding to the generalized LLMs the custom RWE source (Alexandria) we find that we get 2 or more green badged responses 64% of the time and 3 or more 38% of the time.\u003C\/p\u003E\u003Cp id=\u0022p-38\u0022\u003ETo assess each source\u2019s unique contribution, we also measured \u003Cem\u003Enovelty\u003C\/em\u003E\u2014defined as the proportion of questions where only one source produced a Green-badged response, while the others returned Yellow or Red. Novelty rates were 14.0% for Open AI, 7.6% for Alexandria, 1.8% for Gemini, and less than 1% for Perplexity, Claude, and System. 
These results suggest that real-world evidence sources and general-purpose LLM systems each provide distinct and valuable contributions to biomedical question answering.\u003C\/p\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-8\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EDiscussion\u003C\/h2\u003E\u003Cp id=\u0022p-39\u0022\u003EOne of the enduring challenges in clinical care and health policy is the ability to access evidence that directly addresses the question at hand\u003Csup\u003E\u003Ca id=\u0022xref-ref-21-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-21\u0022\u003E21\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-22-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-22\u0022\u003E22\u003C\/a\u003E\u003C\/sup\u003E. Despite the widespread adoption of evidence-based medicine, physicians and decision-makers often face a gap between available evidence and real-world information needs. In part, this challenge stems from the sheer volume and fragmentation of biomedical literature, which far exceeds the capacity of any individual to comprehensively access, evaluate, and synthesize to ground every decision in the latest evidence\u003Csup\u003E\u003Ca id=\u0022xref-ref-2-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-2\u0022\u003E2\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-4-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-4\u0022\u003E4\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-5-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-5\u0022\u003E5\u003C\/a\u003E\u003C\/sup\u003E.\u003C\/p\u003E\u003Cp id=\u0022p-40\u0022\u003EThe emergence of large language models (LLMs) with capabilities in literature retrieval and summarization offers a promising path forward\u003Csup\u003E\u003Ca id=\u0022xref-ref-6-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-6\u0022\u003E6\u003C\/a\u003E\u003C\/sup\u003E. 
However, even with accurate identification and synthesis of relevant publications, there remains a persistent evidence gap\u2014many questions simply fall outside the scope of existing published studies. Bridging this gap requires not only tools to extract and summarize existing literature, but also systems that can surface or generate novel real-world evidence in response to specific clinical or research queries\u003Csup\u003E\u003Ca id=\u0022xref-ref-17-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-17\u0022\u003E17\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-18-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-18\u0022\u003E18\u003C\/a\u003E\u003C\/sup\u003E.\u003C\/p\u003E\u003Cp id=\u0022p-41\u0022\u003EIn this study, we introduced \u003Cem\u003EAnswered with Evidence\u003C\/em\u003E, a framework for evaluating whether LLM-generated responses are (1) relevant, (2) directly responsive to the question, and (3) grounded in evidence. Each response is scored across these criteria and summarized using an intuitive traffic light\u2013style badge system\u2014Green (high confidence and evidence-based), Yellow (partial or uncertain grounding), and Red (unsupported or irrelevant). This system provides users with rapid, interpretable feedback on the reliability of an answer.\u003C\/p\u003E\u003Cp id=\u0022p-42\u0022\u003EAcross the six general-purpose or literature-grounded LLMs, Open AI\u2019s o3 and GPT-5 models generated the highest rate of Green-badged responses (70.1% and 67.1% respectively), compared to between 21% and 45% for the other models evaluated. Notably, despite all models being grounded in Pubmed\/web search they exhibited markedly different performance profiles. The discrepancy in Green badge rates and novelty between these systems suggests that training data alone does not fully explain differences in response quality. Architecture, retrieval mechanisms, response-generation, sentence structure, and word use also likely play a significant role. 
Given that these models have such a high variability in the evaluation, we looked closer at the document referenced as the source of truth and the snippet within the document that the LLM surfaced as the grounding for its answer. This evaluation demonstrated that there was high variability between the documents selected as references. The highest agreement between any two sources was 53% (Claude and Perplexity), with no identified document overlap between OpenAI and Gemini.\u003C\/p\u003E\u003Cp id=\u0022p-43\u0022\u003EThis high variability in the reference document suggests that no single publication-based model can be trusted alone. Missing one or two critical manuscripts about a given clinical scenario would result in a confidently worded but ultimately incorrect and likely dangerous answer.\u003C\/p\u003E\u003Cp id=\u0022p-44\u0022\u003EInstead, building consensus from identifying the same answer surfaced from multiple LLMs is critical. This finding is supported by other such cross-LLM comparisons where utilization of LLM-as-jury has been utilized to find the consensus answer\u003Csup\u003E\u003Ca id=\u0022xref-ref-23-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-23\u0022\u003E23\u003C\/a\u003E\u003C\/sup\u003E. We similarly take an ensemble approach where a single question is considered sufficiently answered by an LLM only if two or more LLMs are evaluated to have a green badge signifying the response is grounded in evidence. Using this methodology 49% of all questions had a component of the question answered with well-grounded published evidence. When adding in the custom-built RWE to answer such questions, the combined sources can answer nearly 64% of questions of interest to physicians. 
These findings underscore the value of combining both published and real-world evidence in biomedical question answering.\u003C\/p\u003E\u003Cp id=\u0022p-45\u0022\u003EAssuming continued improvements in LLM retrieval fidelity and hallucination reduction, we expect PubMed-based systems to eventually converge toward similar badge distributions\u2014potentially reaching a ceiling of around 55% green-badge assignment by 2 or more LLMs. In this context, the ability to access or generate \u003Cem\u003Enovel\u003C\/em\u003E evidence becomes essential. In our analysis, supplementing general-purpose LLMs with Alexandria increased the proportion of high-confidence responses by an additional 15% to the ensemble approach, demonstrating the unique value of real-world evidence in addressing unanswered clinical questions (\u003Ca id=\u0022xref-fig-3-1\u0022 class=\u0022xref-fig\u0022 href=\u0022#F3\u0022\u003EFigure 3\u003C\/a\u003E).\u003C\/p\u003E\u003Cdiv id=\u0022F3\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F3.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022\u0026#x2013; Current Evidence and LLM Capability Synergistic performance A library of custom built RWE to answer questions is able to identify answers to 50% of provider inquiries evaluated. Similarly, an ensemble approach requiring 2 or more general purpose LLMs to produce an evidence grounded answer can produce an answer to physician queries 49% of the time. 
Combining both approaches over 64% of difficult to answer questions by physicians can be answered with current methodology and evidence.\u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-518782870\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;\u0026#x2013; Current Evidence and LLM Capability Synergistic performance\u0026lt;\/span\u0026gt; A library of custom built RWE to answer questions is able to identify answers to 50% of provider inquiries evaluated. Similarly, an ensemble approach requiring 2 or more general purpose LLMs to produce an evidence grounded answer can produce an answer to physician queries 49% of the time. Combining both approaches over 64% of difficult to answer questions by physicians can be answered with current methodology and evidence.\u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure 3\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F3.medium.gif\u0022 width=\u0022440\u0022 height=\u0022153\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure 3\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F3.medium.gif\u0022 width=\u0022440\u0022 height=\u0022153\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig 
first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F3.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure 3\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F3.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022\u003E\u003Cspan class=\u0022fig-label\u0022\u003EFigure 3\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Current Evidence and LLM Capability Synergistic performance\u003C\/span\u003E\u003Cp id=\u0022p-46\u0022 class=\u0022first-child\u0022\u003EA library of custom built RWE to answer questions is able to identify answers to 50% of provider inquiries evaluated. Similarly, an ensemble approach requiring 2 or more general purpose LLMs to produce an evidence grounded answer can produce an answer to physician queries 49% of the time. Combining both approaches over 64% of difficult to answer questions by physicians can be answered with current methodology and evidence.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-47\u0022\u003EThis study has several limitations. First, only a single evaluation framework and LLM question prompt were utilized across the different LLM responses. As a next step, iteration of both the evaluation framework and the question submission prompt should be performed. 
Given that all the LLMs have different response structures, it is possible that a different evaluation framework needs to be utilized for each LLM. Second, several emerging LLM-based literature summarization platforms were not included in this initial analysis and warrant future benchmarking. Third, and most critically, these responses are meant to inform clinical decisions, and an evaluation of the response and reference document\/snippet by a panel of physicians will provide a gold label to determine the accuracy of both the badging and the ensemble approach.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-9\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EConclusion\u003C\/h2\u003E\u003Cp id=\u0022p-48\u0022\u003EAccessing pertinent and reliable evidence remains a significant challenge for healthcare providers, health system leaders, and biomedical researchers. While large language models (LLMs) offer a powerful means to navigate the vast and expanding body of published literature, our findings demonstrate that, even with advanced retrieval and summarization capabilities, approximately 50% of biomedical questions remain inadequately addressed using published sources alone. Similarly, a real-world evidence (RWE) library specifically designed to address gaps in the literature still left nearly half of the questions unanswered. However, when combined, these complementary evidence sources enabled high-confidence answers for nearly two-thirds of clinician\u2013 and researcher-submitted inquiries.\u003C\/p\u003E\u003Cp id=\u0022p-49\u0022\u003EThese findings highlight a key insight: advancing biomedical question answering will require more than improved retrieval of existing literature\u2014it will also require the generation and integration of new evidence generated with the same methodological rigor required for peer-review. 
To realize the full potential of LLMs in clinical and research workflows, investment in scalable, structured real-world evidence generation will be as important as continued advances in model architecture and prompt engineering.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section data-availability\u0022 id=\u0022sec-10\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EData Availability\u003C\/h2\u003E\u003Cp id=\u0022p-50\u0022\u003EAll data produced in the present study are available upon reasonable request to the authors.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-11\u0022\u003E\u003Ch2 class=\u0022\u0022\u003ESupplement\u003C\/h2\u003E\u003Cdiv id=\u0022F4\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-11.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022Figure S1: \u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-518782870\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;Figure S1:\u0026lt;\/span\u0026gt; \u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-11.medium.gif\u0022 
width=\u0022440\u0022 height=\u0022244\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-11.medium.gif\u0022 width=\u0022440\u0022 height=\u0022244\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-11.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download \u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-11.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-12.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022Figure S1: \u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-518782870\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;Figure S1:\u0026lt;\/span\u0026gt; \u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 
data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-12.medium.gif\u0022 width=\u0022440\u0022 height=\u0022255\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-12.medium.gif\u0022 width=\u0022440\u0022 height=\u0022255\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-12.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download \u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F4\/graphic-12.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022\u003E\u003Cspan class=\u0022caption-title\u0022\u003EFigure S1:\u003C\/span\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp 
id=\u0022p-51\u0022\u003EThe prompt returns a JSON-like response structured as:\u003C\/p\u003E\u003Cdiv id=\u0022F5\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F5.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022\u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-518782870\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F5.medium.gif\u0022 width=\u0022440\u0022 height=\u0022154\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F5.medium.gif\u0022 width=\u0022440\u0022 height=\u0022154\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F5.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure5\u0022 data-icon-position=\u0022\u0022 
data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2025\/09\/01\/2025.07.01.25330655\/F5.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv id=\u0022T6\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1058820\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup last\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1058820\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022table-caption\u0022\u003E\u003Cspan class=\u0022table-label\u0022\u003ETable S1\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Pairwise 
Agreement Across Sources\u003C\/span\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv id=\u0022T7\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1058827\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup last\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1058827\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022table-caption\u0022\u003E\u003Cspan class=\u0022table-label\u0022\u003ETable S2\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003E\u2013 Agreement Matrix across all Evidence Sources\u003C\/span\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section fn-group\u0022 id=\u0022fn-group-1\u0022\u003E\u003Ch2\u003EFootnotes\u003C\/h2\u003E\u003Cul\u003E\u003Cli class=\u0022fn-update fn-group-summary-of-updates\u0022 
id=\u0022fn-1\u0022\u003E\u003Cp id=\u0022p-13\u0022\u003EThis manuscript was revised to report the results of additional experiments:\n-An experiment evaluating the LLM-referenced citations for hallucination\n-An experiment evaluating the LLM-referenced snippet for hallucination\n-An experiment evaluating cross-LLM referenced citation for similarity\n-An ensemble approach to determining consensus between LLMs\n\u003C\/p\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section ref-list\u0022 id=\u0022ref-list-1\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EReferences\u003C\/h2\u003E\u003Col class=\u0022cit-list ref-use-labels\u0022\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E1.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-1-1\u0022 title=\u0022View reference 1. in text\u0022 id=\u0022ref-1\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.1\u0022 data-doi=\u002210.1136\/bmj.312.7023.71\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ESackett\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EDL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ERosenberg\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EWM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EGray\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHaynes\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ERB\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan 
class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ERichardson\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EWS\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EEvidence based medicine: what it is and what it isn\u2019t\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EBMJ\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E1996\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E312\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E7023\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E71\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E72\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1136\/bmj.312.7023.71\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DBMJ%26rft.stitle%253DBMJ%26rft.aulast%253DSackett%26rft.auinit1%253DD.%2BL%26rft.volume%253D312%26rft.issue%253D7023%26rft.spage%253D71%26rft.epage%253D72%26rft.atitle%253DEvidence%2Bbased%2Bmedicine%253A%2Bwhat%2Bit%2Bis%2Band%2Bwhat%2Bit%2Bisn%2527t%26rft_id%253Dinfo%253Adoi%252F10.1136%252Fbmj.312.7023.71%26rft_id%253Dinfo%253Apmid%252F8555924%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca 
href=\u0022\/lookup\/ijlink\/YTozOntzOjQ6InBhdGgiO3M6MTQ6Ii9sb29rdXAvaWpsaW5rIjtzOjU6InF1ZXJ5IjthOjQ6e3M6ODoibGlua1R5cGUiO3M6NDoiRlVMTCI7czoxMToiam91cm5hbENvZGUiO3M6MzoiYm1qIjtzOjU6InJlc2lkIjtzOjExOiIzMTIvNzAyMy83MSI7czo0OiJhdG9tIjtzOjUwOiIvbWVkcnhpdi9lYXJseS8yMDI1LzA5LzAxLzIwMjUuMDcuMDEuMjUzMzA2NTUuYXRvbSI7fXM6ODoiZnJhZ21lbnQiO3M6MDoiIjt9\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-ijlink\u0022\u003E\u003Cspan\u003E\u003Cspan class=\u0022cit-reflinks-full-text\u0022\u003E\u003Cspan class=\u0022free-full-text\u0022\u003EFREE \u003C\/span\u003EFull Text\u003C\/span\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E2.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-2-1\u0022 title=\u0022View reference 2. in text\u0022 id=\u0022ref-2\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.2\u0022 data-doi=\u002210.1001\/JAMA.2019.1122\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFanaroff\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EAC\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECaliff\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ERM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EWindecker\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ESmith\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ESC\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan 
class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELopes\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ERD\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003ELevels of Evidence Supporting American College of Cardiology\/American Heart Association and European Society of Cardiology Guidelines, 2008-2018\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJAMA\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2019\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E321\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E11\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E1069\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E1080\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1001\/jama.2019.1122\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJAMA%26rft.volume%253D321%26rft.spage%253D1069%26rft_id%253Dinfo%253Adoi%252F10.1001%252FJAMA.2019.1122%26rft_id%253Dinfo%253Apmid%252F30874755%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1001\/JAMA.2019.1122\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca 
href=\u0022\/lookup\/external-ref?access_num=30874755\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E3.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-3-1\u0022 title=\u0022View reference 3. in text\u0022 id=\u0022ref-3\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.3\u0022 data-doi=\u002210.1186\/s13063-020-4139-0\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHe\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMorales\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EDR\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EGuthrie\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EB\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EExclusion rates in randomized controlled trials of treatments for physical conditions: a systematic review\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ETrials\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2020\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E21\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E228\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1186\/s13063-020-4139-0\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DTrials%26rft.volume%253D21%26rft.spage%253D228%26rft_id%253Dinfo%253Adoi%252F10.1186%252Fs13063-020-4139-0%26rft_id%253Dinfo%253Apmid%252F32102686%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1186\/s13063-020-4139-0\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=32102686\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E4.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-4-1\u0022 title=\u0022View reference 4. 
in text\u0022 id=\u0022ref-4\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.4\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EAlper\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EBS\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHand\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EElliott\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ESG\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EHow much effort is needed to keep up with the literature relevant for primary care?\u003C\/span\u003E \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJ Med Libr Assoc\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2004\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E92\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E4\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E429\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E437\u003C\/span\u003E.\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJournal%2Bof%2Bthe%2BMedical%2BLibrary%2BAssociation%2B%253A%2B%2BJMLA%26rft.stitle%253DJ%2BMed%2BLibr%2BAssoc%26rft.aulast%253DAlper%26rft.auinit1%253DB.%2BS.%26rft.volume%253D92%26rft.issue%253D4%26rft.spage%253D429%26rft.epage%253D437%26rft.atitle%253DHow%2Bmuch%2Beffort%2Bis%2Bneeded%2Bto%2Bkeep%2Bup%2Bwith%2Bthe%2Bliterature%2Brelevant%2Bfor%2Bprimary%2Bcare%253F%26rft_id%253Dinfo%253Apmid%252F15494758%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=15494758\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=000224486200010\u0026amp;link_type=ISI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-newisilink cit-ref-sprinkles-webofscience\u0022\u003E\u003Cspan\u003EWeb of Science\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E5.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-5-1\u0022 
title=\u0022View reference 5. in text\u0022 id=\u0022ref-5\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.5\u0022 data-doi=\u002210.1007\/s10354-021-00849-3\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EWangler\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJansky\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EWhat is the significance of guidelines in the primary care setting?\u003C\/span\u003E \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EWien Med Wochenschr\u003C\/abbr\u003E 1946. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2021\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E171\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E13-14\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E321\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E329\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1007\/s10354-021-00849-3\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca 
href=\u0022{openurl}?query=rft.jtitle%253DWien%2BMed%2BWochenschr%26rft.volume%253D171%26rft.spage%253D321%26rft_id%253Dinfo%253Adoi%252F10.1007%252Fs10354-021-00849-3%26rft_id%253Dinfo%253Apmid%252F34101082%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1007\/s10354-021-00849-3\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=34101082\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E6.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-6-1\u0022 title=\u0022View reference 6. 
in text\u0022 id=\u0022ref-6\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.6\u0022 data-doi=\u002210.1056\/aioa2300068\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EZakka\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EC\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EShad\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ER\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EChaurasia\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EAlmanac \u2013 Retrieval-Augmented Language Models for Clinical Medicine\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ENejm Ai\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2024\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E1\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E2\u003C\/span\u003E).\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1056\/aioa2300068\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DNejm%2BAi%26rft_id%253Dinfo%253Adoi%252F10.1056%252Faioa2300068%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1056\/aioa2300068\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E7.\u003C\/span\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal no-rev-xref\u0022 id=\u0022cit-2025.07.01.25330655v2.7\u0022 data-doi=\u002210.1001\/jamaoncol.2023.2954\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EChen\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EKann\u003C\/span\u003E  \u003Cspan 
class=\u0022cit-name-given-names\u0022\u003EBH\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFoote\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EMB\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EUse of Artificial Intelligence Chatbots for Cancer Treatment Information\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJAMA Oncol\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2023\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E9\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E10\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E1459\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E1462\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1001\/jamaoncol.2023.2954\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJAMA%2BOncol%26rft.volume%253D9%26rft.spage%253D1459%26rft_id%253Dinfo%253Adoi%252F10.1001%252Fjamaoncol.2023.2954%26rft_id%253Dinfo%253Apmid%252F37615976%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1001\/jamaoncol.2023.2954\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles 
cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=37615976\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E8.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-8-1\u0022 title=\u0022View reference 8. in text\u0022 id=\u0022ref-8\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.8\u0022 data-doi=\u002210.1177\/20552076251348850\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELow\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EYS\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJackson\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EML\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHyde\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ERJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EAnswering real-world clinical questions using large language model, retrieval-augmented generation, and agentic systems\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EDigit Health\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E11\u003C\/span\u003E:\u003Cspan class=\u0022cit-fpage\u0022\u003E20552076251348850\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1177\/20552076251348850\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DDigit%2BHealth%26rft.volume%253D11%26rft.spage%253D20552076251348850%26rft_id%253Dinfo%253Adoi%252F10.1177%252F20552076251348850%26rft_id%253Dinfo%253Apmid%252F40510193%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1177\/20552076251348850\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=40510193\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E9.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-9-1\u0022 title=\u0022View reference 9. 
in text\u0022 id=\u0022ref-9\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.9\u0022 data-doi=\u002210.2196\/53164\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EChelli\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EDescamps\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELavou\u00e9\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EV\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EHallucination Rates and Reference Accuracy of ChatGPT and Bard for Systematic Reviews: Comparative Analysis\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJ Med Internet Res\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2024\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E26\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003Ee53164\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.2196\/53164\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJ%2BMed%2BInternet%2BRes%26rft.volume%253D26%26rft.spage%253De53164%26rft_id%253Dinfo%253Adoi%252F10.2196%252F53164%26rft_id%253Dinfo%253Apmid%252F38776130%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.2196\/53164\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=38776130\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E10.\u003C\/span\u003E\u003Cdiv class=\u0022cit ref-cit ref-web no-rev-xref\u0022 id=\u0022cit-2025.07.01.25330655v2.10\u0022\u003E\u003Cdiv 
class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003EOpenEvidence\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EOpenEvidence \u2013 OpenEvidence AI becomes the first AI in history to score above 90% on the United States Medical Licensing Examination (USMLE)\u003C\/span\u003E. \u003Cspan class=\u0022cit-source\u0022\u003EOpenEvidence\u003C\/span\u003E. Accessed June 30, \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E. \u003Ca href=\u0022https:\/\/www.openevidence.com\/announcements\/openevidence-ai-first-ai-score-above-90-percent-on-the-usmle\u0022\u003Ehttps:\/\/www.openevidence.com\/announcements\/openevidence-ai-first-ai-score-above-90-percent-on-the-usmle\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E11.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-11-1\u0022 title=\u0022View reference 11. in text\u0022 id=\u0022ref-11\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2025.07.01.25330655v2.11\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003EPerformance of ChatGPT on USMLE\u003C\/span\u003E: \u003Cspan class=\u0022cit-article-title\u0022\u003EPotential for AI-assisted medical education using large language models\u003C\/span\u003E | \u003Cspan class=\u0022cit-source\u0022\u003EPLOS Digital Health\u003C\/span\u003E. Accessed June 30, \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E. 
\u003Ca href=\u0022https:\/\/journals.plos.org\/digitalhealth\/article?id=10.1371\/journal.pdig.0000198\u0022\u003Ehttps:\/\/journals.plos.org\/digitalhealth\/article?id=10.1371\/journal.pdig.0000198\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E12.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-12-1\u0022 title=\u0022View reference 12. in text\u0022 id=\u0022ref-12\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.12\u0022 data-doi=\u002210.1001\/jamanetworkopen.2025.26021\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBedi\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJiang\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EY\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EChung\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EP\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EKoyejo\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EShah\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EN\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EFidelity of Medical Reasoning in Large Language Models\u003C\/span\u003E. 
\u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJAMA Netw Open\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E8\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E8\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003Ee2526021\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1001\/jamanetworkopen.2025.26021\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJAMA%2BNetw%2BOpen%26rft.volume%253D8%26rft.spage%253D2526021e%26rft_id%253Dinfo%253Adoi%252F10.1001%252Fjamanetworkopen.2025.26021%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1001\/jamanetworkopen.2025.26021\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E13.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-13-1\u0022 title=\u0022View reference 13. 
in text\u0022 id=\u0022ref-13\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2025.07.01.25330655v2.13\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003EPerplexity\u003C\/span\u003E. \u003Cspan class=\u0022cit-source\u0022\u003EPerplexity AI\u003C\/span\u003E. Accessed June 30, \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E. \u003Ca href=\u0022https:\/\/www.perplexity.ai\u0022\u003Ehttps:\/\/www.perplexity.ai\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E14.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-14-1\u0022 title=\u0022View reference 14. in text\u0022 id=\u0022ref-14\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2025.07.01.25330655v2.14\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003EGraph\u003C\/span\u003E. Accessed June 30, \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E. \u003Ca href=\u0022https:\/\/www.system.com\/platform\/system-graph\u0022\u003Ehttps:\/\/www.system.com\/platform\/system-graph\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E15.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-15-1\u0022 title=\u0022View reference 15. 
in text\u0022 id=\u0022ref-15\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.15\u0022 data-doi=\u002210.48550\/arXiv.2505.23802\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBedi\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECui\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EH\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFuentes\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EMedHELM: Holistic Evaluation of Large Language Models for Medical Tasks\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EarXiv\u003C\/abbr\u003E. 
Preprint posted online June 2, \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.48550\/arXiv.2505.23802\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DarXiv%26rft_id%253Dinfo%253Adoi%252F10.48550%252FarXiv.2505.23802%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.48550\/arXiv.2505.23802\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E16.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-16-1\u0022 title=\u0022View reference 16. 
in text\u0022 id=\u0022ref-16\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.16\u0022 data-doi=\u002210.1038\/s41746-024-01258-7\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ETam\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ETYC\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ESivarajkumar\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EKapoor\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EA framework for human evaluation of large language models in healthcare derived from literature review\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ENpj Digit Med\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2024\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E7\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E258\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1038\/s41746-024-01258-7\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DNpj%2BDigit%2BMed%26rft.volume%253D7%26rft.spage%253D258%26rft_id%253Dinfo%253Adoi%252F10.1038%252Fs41746-024-01258-7%26rft_id%253Dinfo%253Apmid%252F39333376%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1038\/s41746-024-01258-7\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=39333376\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E17.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-17-1\u0022 title=\u0022View reference 17. 
in text\u0022 id=\u0022ref-17\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.17\u0022 data-doi=\u002210.1038\/s41746-019-0091-3\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EGombar\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECallahan\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECaliff\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ER\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHarrington\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ER\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EShah\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ENH\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EIt is time to learn from patients like mine\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ENpj Digit Med\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2019\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E2\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E16\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1038\/s41746-019-0091-3\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DNpj%2BDigit%2BMed%26rft.volume%253D2%26rft.spage%253D16%26rft_id%253Dinfo%253Adoi%252F10.1038%252Fs41746-019-0091-3%26rft_id%253Dinfo%253Apmid%252F31304364%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1038\/s41746-019-0091-3\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=31304364\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E18.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-18-1\u0022 title=\u0022View reference 18. 
in text\u0022 id=\u0022ref-18\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.18\u0022 data-doi=\u002210.1056\/CAT.21.0224\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECallahan\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EGombar\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECahan\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EEM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EUsing Aggregate Patient Data at the Bedside via an On-Demand Consultation Service\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ENEJM Catal\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2021\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E2\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E10\u003C\/span\u003E).\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1056\/CAT.21.0224\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DNEJM%2BCatal%26rft_id%253Dinfo%253Adoi%252F10.1056%252FCAT.21.0224%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1056\/CAT.21.0224\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E19.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-19-1\u0022 title=\u0022View reference 19. in text\u0022 id=\u0022ref-19\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2025.07.01.25330655v2.19\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003EHome \\ Anthropic\u003C\/span\u003E. Accessed August 28, 2025. 
\u003Ca href=\u0022https:\/\/www.anthropic.com\/\u0022\u003Ehttps:\/\/www.anthropic.com\/\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E20.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-20-1\u0022 title=\u0022View reference 20. in text\u0022 id=\u0022ref-20\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2025.07.01.25330655v2.20\u0022 data-doi=\u002210.48550\/arXiv.2005.11401\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELewis\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EP\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPerez\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EE\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPiktus\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003ERetrieval-Augmented Generation for Knowledge-Intensive NLP Tasks\u003C\/span\u003E. \u003Cspan class=\u0022cit-source\u0022\u003EarXiv\u003C\/span\u003E. 
Preprint posted online April 12, \u003Cspan class=\u0022cit-pub-date\u0022\u003E2021\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.48550\/arXiv.2005.11401\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DarXiv%26rft_id%253Dinfo%253Adoi%252F10.48550%252FarXiv.2005.11401%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.48550\/arXiv.2005.11401\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E21.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-21-1\u0022 title=\u0022View reference 21. 
in text\u0022 id=\u0022ref-21\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.21\u0022 data-doi=\u002210.1377\/hlthaff.26.2.w181\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EStewart\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EWF\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EShah\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ENR\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ESelna\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EMJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPaulus\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ERA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EWalker\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJM\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EBridging the inferential gap: the electronic health record and clinical evidence\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EHealth Aff Proj Hope\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2007\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E26\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E2\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003Ew181\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E191\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1377\/hlthaff.26.2.w181\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DHealth%2BAff%2BProj%2BHope%26rft_id%253Dinfo%253Adoi%252F10.1377%252Fhlthaff.26.2.w181%26rft_id%253Dinfo%253Apmid%252F17259202%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/ijlink\/YTozOntzOjQ6InBhdGgiO3M6MTQ6Ii9sb29rdXAvaWpsaW5rIjtzOjU6InF1ZXJ5IjthOjQ6e3M6ODoibGlua1R5cGUiO3M6NDoiQUJTVCI7czoxMToiam91cm5hbENvZGUiO3M6OToiaGVhbHRoYWZmIjtzOjU6InJlc2lkIjtzOjk6IjI2LzIvdzE4MSI7czo0OiJhdG9tIjtzOjUwOiIvbWVkcnhpdi9lYXJseS8yMDI1LzA5LzAxLzIwMjUuMDcuMDEuMjUzMzA2NTUuYXRvbSI7fXM6ODoiZnJhZ21lbnQiO3M6MDoiIjt9\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-ijlink\u0022\u003E\u003Cspan\u003E\u003Cspan class=\u0022cit-reflinks-abstract\u0022\u003EAbstract\u003C\/span\u003E\u003Cspan class=\u0022cit-sep cit-reflinks-variant-name-sep\u0022\u003E\/\u003C\/span\u003E\u003Cspan class=\u0022cit-reflinks-full-text\u0022\u003E\u003Cspan class=\u0022free-full-text\u0022\u003EFREE \u003C\/span\u003EFull 
Text\u003C\/span\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E22.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-22-1\u0022 title=\u0022View reference 22. in text\u0022 id=\u0022ref-22\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.22\u0022 data-doi=\u002210.1111\/j.1747-0803.2010.00433.x\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EDarst\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJR\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ENewburger\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJW\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EResch\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ERathod\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ERH\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELock\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJE\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EDeciding without data\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ECongenit Heart Dis\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2010\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E5\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E4\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E339\u003C\/span\u003E-\u003Cspan class=\u0022cit-lpage\u0022\u003E342\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1111\/j.1747-0803.2010.00433.x\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.stitle%253DCongenit%2BHeart%2BDis%26rft.aulast%253DDarst%26rft.auinit1%253DJ.%2BR.%26rft.volume%253D5%26rft.issue%253D4%26rft.spage%253D339%26rft.epage%253D342%26rft.atitle%253DDeciding%2Bwithout%2Bdata.%26rft_id%253Dinfo%253Adoi%252F10.1111%252Fj.1747-0803.2010.00433.x%26rft_id%253Dinfo%253Apmid%252F20653700%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1111\/j.1747-0803.2010.00433.x\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=20653700\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003Ca 
href=\u0022\/lookup\/external-ref?access_num=000289419800003\u0026amp;link_type=ISI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-newisilink cit-ref-sprinkles-webofscience\u0022\u003E\u003Cspan\u003EWeb of Science\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E23.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-23-1\u0022 title=\u0022View reference 23. in text\u0022 id=\u0022ref-23\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2025.07.01.25330655v2.23\u0022 data-doi=\u002210.3389\/fdata.2025.1611389\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBaysan\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EMS\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EUysal\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003E\u0130\u015flek\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003E\u0130\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003E\u00c7\u0131\u011f Karaman\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003E\u00c7\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EG\u00fcng\u00f6r\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ET\u003C\/span\u003E\u003C\/span\u003E. 
\u003Cspan class=\u0022cit-article-title\u0022\u003ELLM-as-a-Judge: automated evaluation of search query parsing using large language models\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EFront Big Data\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E8\u003C\/span\u003E:\u003Cspan class=\u0022cit-fpage\u0022\u003E1611389\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.3389\/fdata.2025.1611389\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DFront%2BBig%2BData%26rft.volume%253D8%26rft.spage%253D1611389%26rft_id%253Dinfo%253Adoi%252F10.3389%252Ffdata.2025.1611389%26rft_id%253Dinfo%253Apmid%252F40761620%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.3389\/fdata.2025.1611389\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=40761620\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2025%2F09%2F01%2F2025.07.01.25330655.atom\u0022 class=\u0022cit-ref-sprinkles 
cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003C\/ol\u003E\u003C\/div\u003E\u003Cspan class=\u0022highwire-journal-article-marker-end\u0022\u003E\u003C\/span\u003E\u003C\/div\u003E\u003Cspan class=\u0022related-urls\u0022\u003E\u003C\/span\u003E\u003C\/div\u003E\u003C\/div\u003E  \u003C\/div\u003E\n\n  \n  \u003C\/div\u003E\n\u003C\/div\u003E\n  \u003C\/div\u003E\n\u003C\/div\u003E\n\u003C\/div\u003E\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/js\/js_zP7WWIfzbyzvaM63L39cNV2juU_1XVH7wduFK9gcMNI.js\u0022\u003E\u003C\/script\u003E\n\u003C\/body\u003E\u003C\/html\u003E"}