{"markup":"\u003C?xml version=\u00221.0\u0022 encoding=\u0022UTF-8\u0022 ?\u003E\n    \u003Chtml version=\u0022HTML+RDFa+MathML 1.1\u0022\n    xmlns:content=\u0022http:\/\/purl.org\/rss\/1.0\/modules\/content\/\u0022\n    xmlns:dc=\u0022http:\/\/purl.org\/dc\/terms\/\u0022\n    xmlns:foaf=\u0022http:\/\/xmlns.com\/foaf\/0.1\/\u0022\n    xmlns:og=\u0022http:\/\/ogp.me\/ns#\u0022\n    xmlns:rdfs=\u0022http:\/\/www.w3.org\/2000\/01\/rdf-schema#\u0022\n    xmlns:sioc=\u0022http:\/\/rdfs.org\/sioc\/ns#\u0022\n    xmlns:sioct=\u0022http:\/\/rdfs.org\/sioc\/types#\u0022\n    xmlns:skos=\u0022http:\/\/www.w3.org\/2004\/02\/skos\/core#\u0022\n    xmlns:xsd=\u0022http:\/\/www.w3.org\/2001\/XMLSchema#\u0022\n    xmlns:mml=\u0022http:\/\/www.w3.org\/1998\/Math\/MathML\u0022\u003E\n  \u003Chead\u003E\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022\/\/cdn.jsdelivr.net\/qtip2\/2.2.1\/jquery.qtip.min.js\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/js\/js_YjAJQgxDlFX6S-O02jj9jCrVbrwlY3CGgCg1FzPlvBs.js\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022\u003E\n\u003C!--\/\/--\u003E\u003C![CDATA[\/\/\u003E\u003C!--\nif(typeof window.MathJax === \u0022undefined\u0022) window.MathJax = { menuSettings: { zoom: \u0022Click\u0022 } };\n\/\/--\u003E\u003C!]]\u003E\n\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/js\/js_waP91NpgGpectm_6Y2XDEauLJ8WCSCBKmmA87unpp2E.js\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.googletagmanager.com\/gtag\/js?id=G-0K57TCX5BY\u0022\u003E\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022\u003E\n\u003C!--\/\/--\u003E\u003C![CDATA[\/\/\u003E\u003C!--\nwindow.dataLayer = window.dataLayer || [];function gtag(){dataLayer.push(arguments)};gtag(\u0022js\u0022, new 
Date());gtag(\u0022set\u0022, \u0022developer_id.dMDhkMT\u0022, true);gtag(\u0022config\u0022, \u0022G-0K57TCX5BY\u0022, {\u0022groups\u0022:\u0022default\u0022,\u0022anonymize_ip\u0022:true});\n\/\/--\u003E\u003C!]]\u003E\n\u003C\/script\u003E\n\u003Cscript type=\u0022text\/javascript\u0022\u003E\n\u003C!--\/\/--\u003E\u003C![CDATA[\/\/\u003E\u003C!--\njQuery.extend(Drupal.settings, {\u0022basePath\u0022:\u0022\\\/\u0022,\u0022pathPrefix\u0022:\u0022\u0022,\u0022highwire\u0022:{\u0022ac\u0022:{\u0022medrxiv;2026.03.23.26349012v1\u0022:{\u0022access\u0022:{\u0022full\u0022:true},\u0022pisa_id\u0022:\u0022medrxiv;2026.03.23.26349012v1\u0022,\u0022apath\u0022:\u0022\u0022,\u0022jcode\u0022:\u0022medrxiv\u0022}},\u0022processed\u0022:[\u0022highwire_math\u0022],\u0022markup\u0022:[{\u0022requested\u0022:\u0022full-text\u0022,\u0022variant\u0022:\u0022full-text\u0022,\u0022view\u0022:\u0022full\u0022,\u0022pisa\u0022:\u0022medrxiv;2026.03.23.26349012v1\u0022}]},\u0022instances\u0022:\u0022{\\u0022highwire_abstract_tooltip\\u0022:{\\u0022content\\u0022:{\\u0022text\\u0022:\\u0022\\u0022},\\u0022style\\u0022:{\\u0022tip\\u0022:{\\u0022width\\u0022:20,\\u0022height\\u0022:20,\\u0022border\\u0022:1,\\u0022offset\\u0022:0,\\u0022corner\\u0022:true},\\u0022classes\\u0022:\\u0022qtip-custom hw-tooltip hw-abstract-tooltip qtip-shadow qtip-rounded\\u0022,\\u0022classes_custom\\u0022:\\u0022hw-tooltip hw-abstract-tooltip\\u0022},\\u0022position\\u0022:{\\u0022at\\u0022:\\u0022right center\\u0022,\\u0022my\\u0022:\\u0022left center\\u0022,\\u0022viewport\\u0022:true,\\u0022adjust\\u0022:{\\u0022method\\u0022:\\u0022shift\\u0022}},\\u0022show\\u0022:{\\u0022event\\u0022:\\u0022mouseenter click \\u0022,\\u0022solo\\u0022:true},\\u0022hide\\u0022:{\\u0022event\\u0022:\\u0022mouseleave 
\\u0022,\\u0022fixed\\u0022:1,\\u0022delay\\u0022:\\u0022100\\u0022}},\\u0022highwire_author_tooltip\\u0022:{\\u0022content\\u0022:{\\u0022text\\u0022:\\u0022\\u0022},\\u0022style\\u0022:{\\u0022tip\\u0022:{\\u0022width\\u0022:15,\\u0022height\\u0022:15,\\u0022border\\u0022:1,\\u0022offset\\u0022:0,\\u0022corner\\u0022:true},\\u0022classes\\u0022:\\u0022qtip-custom hw-tooltip hw-author-tooltip qtip-shadow qtip-rounded\\u0022,\\u0022classes_custom\\u0022:\\u0022hw-tooltip hw-author-tooltip\\u0022},\\u0022position\\u0022:{\\u0022at\\u0022:\\u0022top center\\u0022,\\u0022my\\u0022:\\u0022bottom center\\u0022,\\u0022viewport\\u0022:true,\\u0022adjust\\u0022:{\\u0022method\\u0022:\\u0022\\u0022}},\\u0022show\\u0022:{\\u0022event\\u0022:\\u0022mouseenter \\u0022,\\u0022solo\\u0022:true},\\u0022hide\\u0022:{\\u0022event\\u0022:\\u0022mouseleave \\u0022,\\u0022fixed\\u0022:1,\\u0022delay\\u0022:\\u0022100\\u0022}},\\u0022highwire_reflinks_tooltip\\u0022:{\\u0022content\\u0022:{\\u0022text\\u0022:\\u0022\\u0022},\\u0022style\\u0022:{\\u0022tip\\u0022:{\\u0022width\\u0022:15,\\u0022height\\u0022:15,\\u0022border\\u0022:1,\\u0022mimic\\u0022:\\u0022top center\\u0022,\\u0022offset\\u0022:0,\\u0022corner\\u0022:true},\\u0022classes\\u0022:\\u0022qtip-custom hw-tooltip hw-ref-link-tooltip qtip-shadow qtip-rounded\\u0022,\\u0022classes_custom\\u0022:\\u0022hw-tooltip hw-ref-link-tooltip\\u0022},\\u0022position\\u0022:{\\u0022at\\u0022:\\u0022bottom left\\u0022,\\u0022my\\u0022:\\u0022top left\\u0022,\\u0022viewport\\u0022:true,\\u0022adjust\\u0022:{\\u0022method\\u0022:\\u0022flip\\u0022}},\\u0022show\\u0022:{\\u0022event\\u0022:\\u0022mouseenter \\u0022,\\u0022solo\\u0022:true},\\u0022hide\\u0022:{\\u0022event\\u0022:\\u0022mouseleave 
\\u0022,\\u0022fixed\\u0022:1,\\u0022delay\\u0022:\\u0022100\\u0022}}}\u0022,\u0022qtipDebug\u0022:\u0022{\\u0022leaveElement\\u0022:0}\u0022,\u0022googleanalytics\u0022:{\u0022account\u0022:[\u0022G-0K57TCX5BY\u0022],\u0022trackOutbound\u0022:1,\u0022trackMailto\u0022:1,\u0022trackDownload\u0022:1,\u0022trackDownloadExtensions\u0022:\u00227z|aac|arc|arj|asf|asx|avi|bin|csv|doc(x|m)?|dot(x|m)?|exe|flv|gif|gz|gzip|hqx|jar|jpe?g|js|mp(2|3|4|e?g)|mov(ie)?|msi|msp|pdf|phps|png|ppt(x|m)?|pot(x|m)?|pps(x|m)?|ppam|sld(x|m)?|thmx|qtm?|ra(m|r)?|sea|sit|tar|tgz|torrent|txt|wav|wma|wmv|wpd|xls(x|m|b)?|xlt(x|m)|xlam|xml|z|zip\u0022,\u0022trackColorbox\u0022:1},\u0022ajaxPageState\u0022:{\u0022js\u0022:{\u0022\\\/\\\/cdn.jsdelivr.net\\\/qtip2\\\/2.2.1\\\/jquery.qtip.min.js\u0022:1,\u0022sites\\\/all\\\/modules\\\/highwire\\\/highwire\\\/plugins\\\/highwire_markup_process\\\/js\\\/highwire_article_reference_popup.js\u0022:1,\u0022sites\\\/all\\\/modules\\\/highwire\\\/highwire\\\/plugins\\\/highwire_markup_process\\\/js\\\/highwire_at_symbol.js\u0022:1,\u00220\u0022:1,\u0022sites\\\/all\\\/modules\\\/contrib\\\/google_analytics\\\/googleanalytics.js\u0022:1,\u0022https:\\\/\\\/www.googletagmanager.com\\\/gtag\\\/js?id=G-0K57TCX5BY\u0022:1,\u00221\u0022:1}}});\n\/\/--\u003E\u003C!]]\u003E\n\u003C\/script\u003E\n\u003Clink type=\u0022text\/css\u0022 rel=\u0022stylesheet\u0022 href=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/advagg_css\/css__dn-cpI1YtkU_iLHgA5WhlkxgYWyat_IxjF_B-WSYrpE__a9hIbt0eaZ7d5nhwnm2weG8R_2eXK4EvoOx9dOxouHE__QrrGUc7CpljPR5Aph-ukPbcwtK4AWrHGwCEXJ_k1V_c.css\u0022 media=\u0022all\u0022 \/\u003E\n\u003Clink type=\u0022text\/css\u0022 rel=\u0022stylesheet\u0022 href=\u0022\/\/cdn.jsdelivr.net\/qtip2\/2.2.1\/jquery.qtip.min.css\u0022 media=\u0022all\u0022 \/\u003E\n\u003Clink type=\u0022text\/css\u0022 rel=\u0022stylesheet\u0022 
href=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/advagg_css\/css__HGACIFBlu2o05y3afvqlt5wrE_5Dn6MXsexfuEpeIwg__t4SOPxucAPoV3Os7g8dXqyMB1HRXQridRJ82X7nE33E__QrrGUc7CpljPR5Aph-ukPbcwtK4AWrHGwCEXJ_k1V_c.css\u0022 media=\u0022all\u0022 \/\u003E\n\u003Clink rel=\u0027stylesheet\u0027 type=\u0027text\/css\u0027 href=\u0027\/sites\/all\/modules\/contrib\/panels\/plugins\/layouts\/onecol\/onecol.css\u0027 \/\u003E\u003C\/head\u003E\u003Cbody\u003E\u003Cdiv class=\u0022panels-ajax-tab-panel panels-ajax-tab-panel-article-tab-full-text\u0022\u003E\u003Cdiv class=\u0022panel-display panel-1col clearfix\u0022 \u003E\n  \u003Cdiv class=\u0022panel-panel panel-col\u0022\u003E\n    \u003Cdiv\u003E\u003Cdiv class=\u0022panel-pane pane-highwire-markup\u0022 \u003E\n  \n      \n  \n  \u003Cdiv class=\u0022pane-content\u0022\u003E\n    \u003Cdiv class=\u0022highwire-markup\u0022\u003E\u003Cdiv xmlns=\u0022http:\/\/www.w3.org\/1999\/xhtml\u0022 data-highwire-cite-ref-tooltip-instance=\u0022highwire_reflinks_tooltip\u0022 class=\u0022content-block-markup\u0022 xmlns:xhtml=\u0022http:\/\/www.w3.org\/1999\/xhtml\u0022\u003E\u003Cdiv class=\u0022article fulltext-view \u0022\u003E\u003Cspan class=\u0022highwire-journal-article-marker-start\u0022\u003E\u003C\/span\u003E\u003Cdiv class=\u0022section abstract\u0022 id=\u0022abstract-1\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EAbstract\u003C\/h2\u003E\u003Cdiv id=\u0022sec-1\u0022 class=\u0022subsection\u0022\u003E\u003Cp id=\u0022p-2\u0022\u003E\u003Cstrong\u003EBackground\u003C\/strong\u003E Manual chart abstraction is a major bottleneck in clinical research. In oncology, important outcomes such as disease recurrence and the treatment history are often only documented in clinical notes, limiting the scale and quality of observational and epidemiologic studies. We developed an open-source pipeline that, in a HIPAA-compliant setting, can use any commercially available large language model (LLM) to abstract variables. 
We sought to understand if a wide range of variables could be abstracted from complex longitudinal oncology records with performance similar to that of expert medical oncologists.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-2\u0022 class=\u0022subsection\u0022\u003E\u003Cp id=\u0022p-3\u0022\u003E\u003Cstrong\u003EMethods\u003C\/strong\u003E We randomly selected 100 patients from an institutional breast cancer cohort enriched for complex care. We abstracted a range of key variables from unstructured data, including dates of diagnosis and recurrence, clinical stage, biomarker subtype, genetic testing results, and prescribed systemic therapies, including treatment timing, intent, and reason for discontinuation. The inputs to the LLMs were unnormalized, unlabeled, and unedited clinical notes, pathology reports, medication administration records, and demographics. Breast oncologists abstracted the same variables to create the reference standard. For systemic therapy extraction, a second oncologist and research coordinators served as comparators. In addition to variable-level performance, we examined whether survival and hazard-ratio estimates were similar for fully LLM-derived datasets compared with expert-derived datasets.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-3\u0022 class=\u0022subsection\u0022\u003E\u003Cp id=\u0022p-4\u0022\u003E\u003Cstrong\u003EResults\u003C\/strong\u003E Among 100 patients, the median chart had more than 3,100 pages of text; patients received a median of 7 lines of therapy over 6.5 years of follow-up. The best-performing LLM achieved 99% concordance with the expert for recurrence status, 100% for germline BRCA1\/2 pathogenic variant detection, 99% for hormone receptor status, 96% for HER2 status, 91% for clinical stage, 91% for PIK3CA mutation status, and 90% for ESR1 mutation status. For anti-cancer drug extraction, the best-performing LLM approached inter-oncologist variability. 
For exact therapy-line reconstruction, mean patient-level performance remained 9 percentage points lower than the second oncologist, although inter-LLM disagreement was similar to inter-oncologist disagreement. All four LLMs tested outperformed the research coordinators on systemic therapy abstraction. Recurrence-free survival, overall survival, and hazard ratio estimates were similar between expert-derived and LLM-derived datasets. In an external cohort of 97 young patients with early-stage breast cancer, the unmodified pipeline showed similar performance for recurrence detection and adjuvant endocrine therapy use.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-4\u0022 class=\u0022subsection\u0022\u003E\u003Cp id=\u0022p-5\u0022\u003E\u003Cstrong\u003EConclusions\u003C\/strong\u003E Off-the-shelf general-purpose LLMs in a fixed retrieval pipeline were able to abstract a range of variables from complex longitudinal oncology records with performance approaching inter-oncologist variability for key tasks, without any fine-tuning or institution-specific retraining. This approach offers a practical path to scaling the creation of research-grade retrospective datasets from narrative medical records.\u003C\/p\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-5\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EIntroduction\u003C\/h2\u003E\u003Cp id=\u0022p-18\u0022\u003EClinical research depends on abstracting key variables from the electronic medical record and converting them into structured data for analysis.\u003Csup\u003E\u003Ca id=\u0022xref-ref-1-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-1\u0022\u003E1\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-2-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-2\u0022\u003E2\u003C\/a\u003E\u003C\/sup\u003E This manual process is how we build disease registries, retrospective cohorts, and many real-world evidence datasets. 
Abstracting information from the chart is labor-intensive and vulnerable to inconsistency across reviewers. Many key variables such as diagnoses, outcomes, biomarker results, treatment exposures, and disease progression are often documented only in free text rather than in structured fields. As a result, much of the clinically meaningful information in the narrative record is not currently used for research, which limits the completeness and quality of observational datasets.\u003Csup\u003E\u003Ca id=\u0022xref-ref-3-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-3\u0022\u003E3\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-4-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-4\u0022\u003E4\u003C\/a\u003E\u003C\/sup\u003E\u003C\/p\u003E\u003Cp id=\u0022p-19\u0022\u003EBreast cancer illustrates this problem clearly. Most metastatic breast cancers are recurrences of earlier-stage disease, but SEER only captures initial treatment for patients with \u003Cem\u003Ede novo\u003C\/em\u003E metastatic disease, who represent just 6% of new breast diagnoses.\u003Csup\u003E\u003Ca id=\u0022xref-ref-5-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-5\u0022\u003E5\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-6-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-6\u0022\u003E6\u003C\/a\u003E\u003C\/sup\u003E As a result, population-level estimates of metastatic breast cancer burden in the United States depend on simulation models and claims-based inference.\u003Csup\u003E\u003Ca id=\u0022xref-ref-5-2\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-5\u0022\u003E5\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-7-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-7\u0022\u003E7\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-8-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-8\u0022\u003E8\u003C\/a\u003E\u003C\/sup\u003E Retrospective studies that inform clinical decision-making often rely on labor-intensive manual abstraction of smaller-than-ideal cohorts because identifying cancer 
recurrence is challenging at scale.\u003Csup\u003E\u003Ca id=\u0022xref-ref-9-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-9\u0022\u003E9\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-10-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-10\u0022\u003E10\u003C\/a\u003E\u003C\/sup\u003E Answering the full range of clinically meaningful questions through manual chart review is impossible.\u003C\/p\u003E\u003Cp id=\u0022p-20\u0022\u003ELarge language models (LLMs) may offer a practical way to automate this work. To date, most approaches have relied on proprietary systems or developing task-specific models trained on institutional data. These approaches limit the reproducibility, portability, and local control over protected health information.\u003Csup\u003E\u003Ca id=\u0022xref-ref-11-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-11\u0022\u003E11\u003C\/a\u003E-\u003Ca id=\u0022xref-ref-14-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-14\u0022\u003E14\u003C\/a\u003E\u003C\/sup\u003E Therefore, we sought to understand if off-the-shelf general-purpose LLMs (e.g. ChatGPT, Gemini), available to many healthcare systems today in HIPAA-compliant environments, can reliably abstract complex longitudinal cancer records without fine-tuning, labeled training data, or institution-specific retraining.\u003Csup\u003E\u003Ca id=\u0022xref-ref-15-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-15\u0022\u003E15\u003C\/a\u003E\u003C\/sup\u003E If successful, this approach could provide a practical path toward unlocking large volumes of clinical data for research.\u003C\/p\u003E\u003Cp id=\u0022p-21\u0022\u003EWe developed a chart abstraction pipeline able to use commercially available LLMs and applied it to patients with complex breast cancer histories. We compared the performance of the LLM-derived abstraction with expert oncologist review for recurrence, systemic therapy, tumor characteristics, and genomic testing across multiple LLMs. 
We chose a wide range of tasks to understand if the design was flexible, and to capture the key variables often missing from observational cancer datasets. Because it was unclear how to best measure abstraction of systemic therapies, we decided to benchmark this task to a second oncologist and to research coordinators. Lastly, we assessed if LLM-derived datasets preserved downstream survival and epidemiologic inference.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-6\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EMethods\u003C\/h2\u003E\u003Cdiv id=\u0022sec-7\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EStudy design and objectives\u003C\/h3\u003E\u003Cp id=\u0022p-22\u0022\u003EWe compared a fully automated retrieval-based pipeline using commercially available LLMs to expert oncologist chart review for a range of variables (\u003Ca id=\u0022xref-table-wrap-1-1\u0022 class=\u0022xref-table\u0022 href=\u0022#T1\u0022\u003ETable 1\u003C\/a\u003E). The primary endpoints were agreement between LLM-derived and expert-derived data on cancer recurrence, including whether recurrence occurred and its timing, and on the number and composition of systemic treatment lines. Secondary endpoints were agreement on other clinical variables, comparison with research coordinators for selected variables, inter-oncologist variability in systemic therapy abstraction, and preservation of downstream inference when fully LLM-derived datasets were substituted for expert-derived datasets. 
This study was approved by the Stanford IRB under protocol 19482.\u003C\/p\u003E\u003Cdiv id=\u0022T1\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1184185\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1184185\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022download-ppt last\u0022\u003E\u003Ca href=\u0022\/highwire\/powerpoint\/1184185\u0022 class=\u0022highwire-figure-link highwire-figure-link-ppt\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload powerpoint\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022table-caption\u0022\u003E\u003Cspan class=\u0022table-label\u0022\u003ETable 1.\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003EClinical variables extracted from the electronic medical record and evaluation metrics.\u003C\/span\u003E\u003Cp id=\u0022p-23\u0022 
class=\u0022first-child\u0022\u003EDate-based variables were evaluated using concordance within \u00b190 days in the primary analysis, with sensitivity analyses using alternate thresholds. Categorical variables were evaluated using exact concordance. Systemic therapy abstraction included both exact lines of therapy and component anti-cancer drugs, as well as matched-line start and stop dates, treatment intent, and reason for discontinuation. For genetic testing, we had access to the files from Foundation Medicine and from the companies performing the germline genetic testing, so these files were used as the reference.\u003C\/p\u003E\u003Cp id=\u0022p-24\u0022\u003E^ Patient-level mean Jaccard similarity was used as the benchmark for inter-expert agreement in systemic therapy abstraction.\u003C\/p\u003E\u003Cp id=\u0022p-25\u0022\u003E# For analysis, discontinuation reasons were collapsed to disease progression versus other. Progression included documented progressive disease, hospice enrollment related to advancing cancer, death, or decline in performance status in the setting of progressing disease. 
Other included planned completion, toxicity or adverse event, patient preference, clinician choice, and transfer of care.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv id=\u0022T2\u0022 class=\u0022table pos-float\u0022\u003E\u003Cdiv class=\u0022table-inline table-callout-links\u0022\u003E\u003Cdiv class=\u0022callout\u0022\u003E\u003Cspan\u003EView this table:\u003C\/span\u003E\u003Cul class=\u0022callout-links\u0022\u003E\u003Cli class=\u0022view-inline first\u0022\u003E\u003Ca href=\u0022\u0022 class=\u0022table-expand-inline\u0022 data-table-url=\u0022\/highwire\/markup\/1184180\/expansion?postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0026amp;table-expand-inline=1\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView inline\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022view-popup\u0022\u003E\u003Ca href=\u0022\/highwire\/markup\/1184180\/expansion?width=1000\u0026amp;height=500\u0026amp;iframe=true\u0026amp;postprocessors=highwire_tables%2Chighwire_reclass%2Chighwire_figures%2Chighwire_math%2Chighwire_inline_linked_media%2Chighwire_embed\u0022 class=\u0022colorbox colorbox-load table-expand-popup\u0022 rel=\u0022gallery-fragment-tables\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EView popup\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022download-ppt last\u0022\u003E\u003Ca href=\u0022\/highwire\/powerpoint\/1184180\u0022 class=\u0022highwire-figure-link highwire-figure-link-ppt\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload powerpoint\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022table-caption\u0022\u003E\u003Cspan class=\u0022table-label\u0022\u003ETable 2.\u003C\/span\u003E \u003Cspan 
class=\u0022caption-title\u0022\u003ECohort characteristics.\u003C\/span\u003E\u003Cp id=\u0022p-26\u0022 class=\u0022first-child\u0022\u003EClinical characteristics from the first expert-derived dataset of the 100-patient breast cancer cohort and measures of chart complexity and size.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-8\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EStudy cohort and data extraction\u003C\/h3\u003E\u003Cp id=\u0022p-27\u0022\u003EWe randomly selected 100 patients from an institutional database of patients with breast cancer who had undergone either tissue or blood-based FoundationOne testing (Foundation Medicine, Cambridge, MA, USA).\u003Csup\u003E\u003Ca id=\u0022xref-ref-16-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-16\u0022\u003E16\u003C\/a\u003E\u003C\/sup\u003E This intentionally enriched the sample for complex disease trajectories while preserving heterogeneity in documentation patterns and treating clinicians across the academic flagship campus and a community-affiliate practice.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-9\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EReference standard generation and human comparators\u003C\/h3\u003E\u003Cp id=\u0022p-28\u0022\u003EFour medical oncologists specializing in breast cancer care (JCD, NHD, MBM, and JLC) were each assigned a random subset of patients and asked to abstract the variables listed in \u003Ca id=\u0022xref-table-wrap-1-2\u0022 class=\u0022xref-table\u0022 href=\u0022#T1\u0022\u003ETable 1\u003C\/a\u003E. 
They were instructed to use all available data in the medical record, excluding external notes accessible only through Epic\u2019s external note viewer Care Everywhere (Epic Systems, Verona, WI, USA).\u003Csup\u003E\u003Ca id=\u0022xref-ref-17-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-17\u0022\u003E17\u003C\/a\u003E\u003C\/sup\u003E Experts were provided the clinical definitions used in the study (Supplementary Methods), but were not told how to abstract the variables.\u003C\/p\u003E\u003Cp id=\u0022p-29\u0022\u003EFor most clinical variables, a single expert abstraction served as the reference standard. Because systemic therapy abstraction was expected to be the most difficult task, and the hardest to directly measure, a second oncologist independently abstracted the same systemic therapy variables for each patient. This allowed inter-expert variability, rather than a single ground truth, to serve as the benchmark for performance. Experts were asked to reconstruct lines of therapy, list their component drugs, assign start and stop dates, classify treatment intent as curative or palliative, and determine whether discontinuation was due to disease progression or another reason such as toxicity or patient preference.\u003C\/p\u003E\u003Cp id=\u0022p-30\u0022\u003EAs an additional point of comparison, research coordinators had previously abstracted the original date of diagnosis, the date of distant metastatic disease, and the same systemic therapy variables. 
Because the research coordinator abstraction was performed in 2022, all comparisons involving research coordinators were censored on June 1, 2022.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-10\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003ELLM abstraction pipeline overview\u003C\/h3\u003E\u003Cp id=\u0022p-31\u0022\u003EA detailed description of the pipeline is in the Supplement and GitHub repository (\u003Ca id=\u0022xref-fig-1-1\u0022 class=\u0022xref-fig\u0022 href=\u0022#F1\u0022\u003EFigure 1\u003C\/a\u003E). On January 10, 2026, we downloaded all available text-based electronic medical record documents for each patient from Stanford\u2019s research warehouse.\u003Csup\u003E\u003Ca id=\u0022xref-ref-18-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-18\u0022\u003E18\u003C\/a\u003E\u003C\/sup\u003E Pathology reports, demographics, clinical notes, and medication administration records were exported as separate CSV files, with one row per document and one folder per patient. Original metadata, including document type, author, and entry date, were preserved. The warehouse does not preserve images, scanned documents, or screenshots in the notes. No preprocessing, normalization, or cleaning of source documents was performed before ingestion into the pipeline.\u003C\/p\u003E\u003Cdiv id=\u0022F1\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F1.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022Fully Automated Chart Abstraction Workflow. Text documents from the electronic medical record were exported from the institutional research warehouse, segmented into chunks, and indexed for exact-word, BM25, and semantic retrieval. 
For each task, retrieved text was then passed to commercially available LLMs using schema-constrained prompts to generate structured outputs.\u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-750607719\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;Fully Automated Chart Abstraction Workflow.\u0026lt;\/span\u0026gt; Text documents from the electronic medical record were exported from the institutional research warehouse, segmented into chunks, and indexed for exact-word, BM25, and semantic retrieval. For each task, retrieved text was then passed to commercially available LLMs using schema-constrained prompts to generate structured outputs.\u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure 1.\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F1.medium.gif\u0022 width=\u0022440\u0022 height=\u0022117\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure 1.\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F1.medium.gif\u0022 width=\u0022440\u0022 height=\u0022117\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca 
href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F1.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure 1.\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F1.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022 xmlns:xhtml=\u0022http:\/\/www.w3.org\/1999\/xhtml\u0022\u003E\u003Cspan class=\u0022fig-label\u0022\u003EFigure 1.\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003EFully Automated Chart Abstraction Workflow.\u003C\/span\u003E\u003Cp id=\u0022p-32\u0022 class=\u0022first-child\u0022\u003EText documents from the electronic medical record were exported from the institutional research warehouse, segmented into chunks, and indexed for exact-word, BM25, and semantic retrieval. For each task, retrieved text was then passed to commercially available LLMs using schema-constrained prompts to generate structured outputs.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-33\u0022\u003EThe pipeline takes each narrative document and segments it into chunks approximating paragraph-length excerpts. These then can be retrieved and passed to the LLM with a task-specific prompt. 
Chunks are embedded to enable semantic retrieval.\u003Csup\u003E\u003Ca id=\u0022xref-ref-19-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-19\u0022\u003E19\u003C\/a\u003E\u003C\/sup\u003E For each variable in \u003Ca id=\u0022xref-table-wrap-1-3\u0022 class=\u0022xref-table\u0022 href=\u0022#T1\u0022\u003ETable 1\u003C\/a\u003E, retrieval was restricted to the document types most relevant to manual abstraction of that variable, and custom prompts were used for each variable. For example, for the dates of diagnosis, pathology reports were used first, followed by clinical notes. Retrieval used a combination of search strategies to find candidate text chunks including exact word search, BM25, and semantic embedding queries depending on the variable (Supplementary Table S1).\u003Csup\u003E\u003Ca id=\u0022xref-ref-20-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-20\u0022\u003E20\u003C\/a\u003E,\u003Ca id=\u0022xref-ref-21-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-21\u0022\u003E21\u003C\/a\u003E\u003C\/sup\u003E\u003C\/p\u003E\u003Cp id=\u0022p-34\u0022\u003ERetrieved text chunks were then provided to HIPAA-compliant, commercially available LLMs. We evaluated GPT-5, GPT-4o, DeepSeek-R1, and Gemini 2.5 Pro through Stanford\u2019s SecureGPT platform.\u003Csup\u003E\u003Ca id=\u0022xref-ref-22-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-22\u0022\u003E22\u003C\/a\u003E\u003C\/sup\u003E Prompts and the evidence sent to the LLMs were identical for each task. Tasks were stateless (i.e. no chat history), but for multi-pass tasks, intermediate outputs were carried forward. After pilot development, prompts, retrieval parameters, and task-specific workflows were fixed before final model evaluation. For a given task, all models received identical text chunks and prompts. 
The LLMs had no access to expert annotations or structured reference data.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-11\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EOutcomes and statistical analysis\u003C\/h3\u003E\u003Cp id=\u0022p-35\u0022\u003EThe primary endpoints of this descriptive study were agreement between LLM-derived and expert-derived abstraction for recurrence dates and lines of systemic therapy. We also evaluated the concordance for the additional variables listed in \u003Ca id=\u0022xref-table-wrap-1-4\u0022 class=\u0022xref-table\u0022 href=\u0022#T1\u0022\u003ETable 1\u003C\/a\u003E. For all non-drug variables, we prespecified greater than 90% agreement with expert-derived data for at least two LLMs as an arbitrary threshold for encouraging performance. For date-based variables, agreement was defined as concordance within \u00b1 90 days, which we prespecified as a clinically meaningful threshold; we also examined concordance within \u00b1 30 days for select variables. Categorical variables required exact concordance. For mutation testing, the primary analysis focused on mutation presence, with all other outcomes treated as negative or not found.\u003C\/p\u003E\u003Cp id=\u0022p-36\u0022\u003EFor prescribed systemic therapy, we evaluated both exact lines of therapy and the anti-cancer drugs contained within those lines. We prespecified inter-oncologist variability as the benchmark for systemic therapy performance. We considered overlap of the confidence intervals for patient-level mean Jaccard similarity between at least two LLMs and the second oncologist as encouraging performance.\u003Csup\u003E\u003Ca id=\u0022xref-ref-23-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-23\u0022\u003E23\u003C\/a\u003E\u003C\/sup\u003E After therapy-name normalization, predicted and reference lines were matched using a greedy one-to-one algorithm based on temporal proximity. 
We also calculated precision, recall, and F1 score for both line-level and drug-level extraction. Additional analyses included agreement on the number of therapy lines and, among matched lines, agreement on start and stop dates within \u00b1 30 days, treatment intent, and reason for discontinuation.\u003C\/p\u003E\u003Cp id=\u0022p-37\u0022\u003EAfter abstraction, we created two separate analytic datasets: one fully LLM-derived and one expert-derived. We then examined overall survival from initial breast cancer diagnosis and invasive recurrence-free survival. Censoring was done at the last note in the chart. Differences in survival were measured using log-rank tests and visualized with Kaplan\u2013Meier curves. Because death registry linkage was not used, and less than half the cohort had a documented death date in the ground truth data, we conservatively estimated survival by assuming that patients without a recorded death date were dead at their last clinical follow-up. The standard Kaplan-Meier censoring approach is also presented.\u003Csup\u003E\u003Ca id=\u0022xref-ref-24-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-24\u0022\u003E24\u003C\/a\u003E\u003C\/sup\u003E To compare effect estimates in human-derived and LLM-derived datasets, we evaluated univariate hazard ratio estimates for stage (4 vs 1 \u2013 3) and hormone receptor status (negative vs positive) on overall survival and recurrence-free survival for the early stage patients. 
We compared hazard ratio estimates and 95% confidence intervals from expert-derived and LLM-derived datasets and used Cochran\u2019s Q test as a formal test for heterogeneity between effect estimates.\u003C\/p\u003E\u003Cp id=\u0022p-38\u0022\u003EConfidence intervals (CIs) for all agreement and performance metrics were estimated using bias-corrected and accelerated bootstrap resampling at the patient level with 1,000 iterations.\u003Csup\u003E\u003Ca id=\u0022xref-ref-25-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-25\u0022\u003E25\u003C\/a\u003E\u003C\/sup\u003E All analyses were conducted in R version 4.5.2 (R Foundation for Statistical Computing, Vienna, Austria) using base functions and the \u003Cem\u003Eboot\u003C\/em\u003E and \u003Cem\u003Esurvival\u003C\/em\u003E packages. The analytic code is available on GitHub.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-12\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EExternal Validation in Young Breast Cancer Patients\u003C\/h3\u003E\u003Cp id=\u0022p-39\u0022\u003ETo examine performance in a clinically distinct population, we evaluated a previously manually abstracted cohort of young patients diagnosed with breast cancer before becoming pregnant.\u003Csup\u003E\u003Ca id=\u0022xref-ref-26-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-26\u0022\u003E26\u003C\/a\u003E\u003C\/sup\u003E We compared recurrence detection and receipt of adjuvant endocrine therapy for patients who had an initial invasive diagnosis and hormone receptor\u2013positive disease. We compared expert-abstraction to the two best performing LLMs. 
The pipeline, retrieval strategy, and prompts were applied to this cohort without modification.\u003C\/p\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-13\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EResults\u003C\/h2\u003E\u003Cp id=\u0022p-40\u0022\u003EFor simplicity, the main text focuses on the two LLMs that performed best overall; results for all four models are in Supplementary Figure S1 and Supplementary Table S2.\u003C\/p\u003E\u003Cp id=\u0022p-41\u0022\u003EThe 100-patient cohort was complex with around 1,100 individual drugs prescribed in a median of 7 lines of therapy (interquartile range [IQR], 4.75 \u2013 9) over 6.5 years of follow-up from diagnosis (IQR, 3.7 \u2013 9.9 years). The median chart size was approximately 2.3 million tokens or roughly 3,100 pages of text. The average time to process an individual patient ranged from 1 \u2013 11 minutes (Supplementary Table S7).\u003C\/p\u003E\u003Cdiv id=\u0022sec-14\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EAgreement for non-systemic therapy variables\u003C\/h3\u003E\u003Cp id=\u0022p-42\u0022\u003EAcross non-systemic variables, the pipeline showed high agreement with expert oncologist abstraction (\u003Ca id=\u0022xref-fig-2-1\u0022 class=\u0022xref-fig\u0022 href=\u0022#F2\u0022\u003EFigure 2\u003C\/a\u003E; Supplementary Figure S1; Supplementary Table S2). The two best-performing LLMs achieved at least 90% agreement across all 13 variables. Agreement was highest for variables anchored to pathology reports or demographic data. 
Variables with heterogeneous documentation, those requiring longitudinal reasoning such as stage assignment, and variables often available only in scanned PDFs or screenshots not retained in the research warehouse had lower agreement (\u003Ca id=\u0022xref-fig-2-2\u0022 class=\u0022xref-fig\u0022 href=\u0022#F2\u0022\u003EFigure 2\u003C\/a\u003E; Supplementary Table S6).\u003C\/p\u003E\u003Cdiv id=\u0022F2\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F2.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022Agreement with expert oncologist abstraction across key clinical variables. Forest plot showing agreement with expert oncologist abstraction and 95% bootstrap confidence intervals for the best and second-best performing LLMs across key clinical variables. Research coordinators are shown for variables they previously abstracted. Date-based variables were evaluated using concordance within \u0026#xB1; 90 days. Categorical variables were evaluated using exact concordance. 
* Treatment intent and reason for discontinuation were evaluated only among matched therapy lines; evaluable denominators were n = 651 for the second oncologist, n = 645 for Gemini, n = 620 for GPT-5, and n = 551 for the research coordinator.\u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-750607719\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;Agreement with expert oncologist abstraction across key clinical variables.\u0026lt;\/span\u0026gt; Forest plot showing agreement with expert oncologist abstraction and 95% bootstrap confidence intervals for the best and second-best performing LLMs across key clinical variables. Research coordinators are shown for variables they previously abstracted. Date-based variables were evaluated using concordance within \u0026#xB1; 90 days. Categorical variables were evaluated using exact concordance. 
* Treatment intent and reason for discontinuation were evaluated only among matched therapy lines; evaluable denominators were n = 651 for the second oncologist, n = 645 for Gemini, n = 620 for GPT-5, and n = 551 for the research coordinator.\u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure 2.\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F2.medium.gif\u0022 width=\u0022381\u0022 height=\u0022440\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure 2.\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F2.medium.gif\u0022 width=\u0022381\u0022 height=\u0022440\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F2.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure 2.\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F2.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new 
tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022\u003E\u003Cspan class=\u0022fig-label\u0022\u003EFigure 2.\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003EAgreement with expert oncologist abstraction across key clinical variables.\u003C\/span\u003E\u003Cp id=\u0022p-43\u0022 class=\u0022first-child\u0022\u003EForest plot showing agreement with expert oncologist abstraction and 95% bootstrap confidence intervals for the best and second-best performing LLMs across key clinical variables. Research coordinators are shown for variables they previously abstracted. Date-based variables were evaluated using concordance within \u00b1 90 days. Categorical variables were evaluated using exact concordance.\u003C\/p\u003E\u003Cp id=\u0022p-44\u0022\u003E* Treatment intent and reason for discontinuation were evaluated only among matched therapy lines; evaluable denominators were n = 651 for the second oncologist, n = 645 for Gemini, n = 620 for GPT-5, and n = 551 for the research coordinator.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-45\u0022\u003EFor the original diagnosis date, the two best-performing LLMs agreed with the expert on more than 97% of patients. No original diagnosis dates differed by more than 1 year (Supplementary Figure S2). For metastatic recurrence, agreement within \u00b1 90 days was 90% and 96% for the two best-performing LLMs; 90% and 82% of recurrence dates were within 30 days. Locoregional recurrence had high date concordance (Supplementary Figure S2), but with more false negatives than metastatic recurrence. The two best-performing LLMs missed 3 and 5 events, respectively. In the 6 total unique cases, the LLMs had classified the recurrence as distant metastatic rather than locoregional. 
Full model-by-model results are shown in Supplementary Table S2, with an expanded forest plot in Supplementary Figure S1, confusion matrices for stage and hormone receptor and HER2 status in Supplementary Figure S3, and a qualitative error analysis in Supplementary Table S6.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-15\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003ESystemic therapy abstraction relative to inter-expert variability\u003C\/h3\u003E\u003Cp id=\u0022p-46\u0022\u003ECompared with the first expert oncologist, the second oncologist achieved a mean patient-level Jaccard similarity of 0.95 (95% CI, 0.92 to 0.96) for all prescribed anti-cancer drugs and 0.86 (95% CI, 0.81 to 0.89) for reconstructing the exact lines of therapy (\u003Ca id=\u0022xref-fig-4-1\u0022 class=\u0022xref-fig\u0022 href=\u0022#F4\u0022\u003EFigure 4\u003C\/a\u003E; Supplementary Tables S2 and S3). Among matched lines (n = 651), oncologist agreement was 93% for treatment intent, 92% for reason for discontinuation, 98% for start date within \u00b1 30 days, and 90% for stop date within \u00b1 30 days.\u003C\/p\u003E\u003Cdiv id=\u0022F3\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F3.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022Survival estimates derived from expert versus LLM chart abstraction. Kaplan\u0026#x2013;Meier curves comparing survival estimates generated from fully expert-derived data and fully LLM-derived data for the two best-performing LLMs. Solid curves show a conservative lower bound analysis where censoring is assumed to represent death\/recurrence. 
The dashed curves show the standard Kaplan\u0026#x2013;Meier approach with censoring at last follow-up for comparison. (A) Overall survival. (B) Invasive recurrence-free survival among patients with stage 1 \u0026#x2013; 3 diseases. Differences between expert and LLM curves were separately assessed using log-rank tests.\u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-750607719\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;Survival estimates derived from expert versus LLM chart abstraction.\u0026lt;\/span\u0026gt; Kaplan\u0026#x2013;Meier curves comparing survival estimates generated from fully expert-derived data and fully LLM-derived data for the two best-performing LLMs. Solid curves show a conservative lower bound analysis where censoring is assumed to represent death\/recurrence. The dashed curves show the standard Kaplan\u0026#x2013;Meier approach with censoring at last follow-up for comparison. (A) Overall survival. (B) Invasive recurrence-free survival among patients with stage 1 \u0026#x2013; 3 diseases. 
Differences between expert and LLM curves were separately assessed using log-rank tests.\u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure 3.\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F3.medium.gif\u0022 width=\u0022440\u0022 height=\u0022177\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure 3.\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F3.medium.gif\u0022 width=\u0022440\u0022 height=\u0022177\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F3.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure 3.\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F3.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022\u003E\u003Cspan class=\u0022fig-label\u0022\u003EFigure 3.\u003C\/span\u003E \u003Cspan 
class=\u0022caption-title\u0022\u003ESurvival estimates derived from expert versus LLM chart abstraction.\u003C\/span\u003E\u003Cp id=\u0022p-47\u0022 class=\u0022first-child\u0022\u003EKaplan\u2013Meier curves comparing survival estimates generated from fully expert-derived data and fully LLM-derived data for the two best-performing LLMs. Solid curves show a conservative lower bound analysis where censoring is assumed to represent death\/recurrence. The dashed curves show the standard Kaplan\u2013Meier approach with censoring at last follow-up for comparison. (A) Overall survival. (B) Invasive recurrence-free survival among patients with stage 1 \u2013 3 diseases. Differences between expert and LLM curves were separately assessed using log-rank tests.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv id=\u0022F4\u0022 class=\u0022fig pos-float type-figure  odd\u0022\u003E\u003Cdiv class=\u0022highwire-figure\u0022\u003E\u003Cdiv class=\u0022fig-inline-img-wrapper\u0022\u003E\u003Cdiv class=\u0022fig-inline-img\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F4.large.jpg?width=800\u0026amp;height=600\u0026amp;carousel=1\u0022 title=\u0022Patient-level overlap in systemic therapy abstraction. Violin plots showing patient-level Jaccard similarity for abstraction of all prescribed anti-cancer drugs (Panel A) and exact therapy lines (Panel B). Diamonds indicate medians and bars are the interquartile ranges. 
Results are shown for the second oncologist, the two best-performing LLMs, and research coordinators relative to the expert oncologist reference.\u0022 class=\u0022highwire-fragment fragment-images colorbox-load\u0022 rel=\u0022gallery-fragment-images-750607719\u0022 data-figure-caption=\u0022\u0026lt;div class=\u0026quot;highwire-markup\u0026quot;\u0026gt;\u0026lt;span xmlns=\u0026quot;http:\/\/www.w3.org\/1999\/xhtml\u0026quot; class=\u0026quot;caption-title\u0026quot;\u0026gt;Patient-level overlap in systemic therapy abstraction.\u0026lt;\/span\u0026gt; Violin plots showing patient-level Jaccard similarity for abstraction of all prescribed anti-cancer drugs (Panel A) and exact therapy lines (Panel B). Diamonds indicate medians and bars are the interquartile ranges. Results are shown for the second oncologist, the two best-performing LLMs, and research coordinators relative to the expert oncologist reference.\u0026lt;\/div\u0026gt;\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003E\u003Cspan class=\u0022hw-responsive-img\u0022\u003E\u003Cimg class=\u0022highwire-fragment fragment-image lazyload\u0022 alt=\u0022Figure 4.\u0022 src=\u0022data:image\/gif;base64,R0lGODlhAQABAIAAAAAAAP\/\/\/yH5BAEAAAAALAAAAAABAAEAAAIBRAA7\u0022 data-src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F4.medium.gif\u0022 width=\u0022395\u0022 height=\u0022440\u0022\/\u003E\u003Cnoscript\u003E\u003Cimg class=\u0022highwire-fragment fragment-image\u0022 alt=\u0022Figure 4.\u0022 src=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F4.medium.gif\u0022 width=\u0022395\u0022 height=\u0022440\u0022\/\u003E\u003C\/noscript\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cul class=\u0022highwire-figure-links inline\u0022\u003E\u003Cli class=\u0022download-fig first\u0022\u003E\u003Ca 
href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F4.large.jpg?download=true\u0022 class=\u0022highwire-figure-link highwire-figure-link-download\u0022 title=\u0022Download Figure 4.\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EDownload figure\u003C\/a\u003E\u003C\/li\u003E\u003Cli class=\u0022new-tab last\u0022\u003E\u003Ca href=\u0022https:\/\/www.medrxiv.org\/content\/medrxiv\/early\/2026\/03\/25\/2026.03.23.26349012\/F4.large.jpg\u0022 class=\u0022highwire-figure-link highwire-figure-link-newtab\u0022 target=\u0022_blank\u0022 data-icon-position=\u0022\u0022 data-hide-link-title=\u00220\u0022\u003EOpen in new tab\u003C\/a\u003E\u003C\/li\u003E\u003C\/ul\u003E\u003C\/div\u003E\u003Cdiv class=\u0022fig-caption\u0022\u003E\u003Cspan class=\u0022fig-label\u0022\u003EFigure 4.\u003C\/span\u003E \u003Cspan class=\u0022caption-title\u0022\u003EPatient-level overlap in systemic therapy abstraction.\u003C\/span\u003E\u003Cp id=\u0022p-48\u0022 class=\u0022first-child\u0022\u003EViolin plots showing patient-level Jaccard similarity for abstraction of all prescribed anti-cancer drugs (Panel A) and exact therapy lines (Panel B). Diamonds indicate medians and bars are the interquartile ranges. Results are shown for the second oncologist, the two best-performing LLMs, and research coordinators relative to the expert oncologist reference.\u003C\/p\u003E\u003Cdiv class=\u0022sb-div caption-clear\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cp id=\u0022p-49\u0022\u003EThe LLMs had a similar mean patient-level Jaccard similarity of 0.91 (95% CI, 0.89 to 0.93) and 0.90 (95% CI, 0.87 to 0.92) for prescribed anti-cancer drugs with CIs that overlapped those of the second oncologist. For lines of therapy, they were notably lower at 0.77 (95% CI, 0.72 to 0.81) and 0.73 (95% CI, 0.69 to 0.78). 
When the two best-performing LLMs were compared with each other, they disagreed to a similar extent as the two expert oncologists did with Jaccard similarities of 0.96 (95% CI, 0.94 to 0.98) for drugs and 0.84 (95% CI, 0.79 to 0.87) for lines of therapy. Violin plots for all four LLMs are shown in Supplementary Figure S6.\u003C\/p\u003E\u003Cp id=\u0022p-50\u0022\u003EResearch coordinators performed worse than all LLMs on systemic therapy abstraction, with a patient-level Jaccard similarity of 0.70 (95% CI, 0.67 to 0.74) for prescribed anti-cancer drugs and 0.53 (95% CI, 0.49 to 0.58) for the lines of therapy. Even after we post hoc collapsed all aromatase inhibitors and all taxanes into single entities, research coordinators still had worse performance than the worst LLM for line reconstruction (0.65 vs 0.71). Abstraction performance was stable for most LLMs across large and long charts, but performance declined for research coordinators as the chart got bigger (Supplementary Figure S5). A representative treatment timeline for a complex patient is shown in Supplementary Figure S4.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-16\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EPreservation of survival and effect estimates\u003C\/h3\u003E\u003Cp id=\u0022p-51\u0022\u003ECohort level inference for survival was preserved when fully LLM-derived datasets were used in place of fully expert-derived datasets (\u003Ca id=\u0022xref-fig-3-1\u0022 class=\u0022xref-fig\u0022 href=\u0022#F3\u0022\u003EFigure 3\u003C\/a\u003E). 
Because fewer than half of patients had a documented date of death, overall survival estimates were sensitive to censoring assumptions, with the median in the expert-derived dataset differing by approximately 3 years depending on the censoring rule; \u003Ca id=\u0022xref-fig-3-2\u0022 class=\u0022xref-fig\u0022 href=\u0022#F3\u0022\u003EFigure 3\u003C\/a\u003E\u2019s solid lines use a conservative approach in which patients without a documented death date are treated as having died at their last clinical follow-up. The dashed lines show traditional censoring at last follow-up. The censoring rule did not change the similarity of survival estimates for LLM and expert. Median overall survival was 78.2 months for the expert and 78.2 months for the two LLMs (log-rank P = 0.99 and 1.00). Median recurrence-free survival was 34.9 months for the expert and 34.9 months for the two LLMs (P = 0.91 and 0.97).\u003C\/p\u003E\u003Cp id=\u0022p-52\u0022\u003EThe hazard ratios and confidence intervals for the risk of death by disease stage were similar for expert-derived and LLM-derived datasets: 2.80 (95% CI, 1.57 to 5.00) in the expert-derived dataset, compared with 2.85 (95% CI, 1.38 to 5.86) and 2.58 (95% CI, 1.25 to 5.32) for the best two LLMs. For hormone receptor-negative versus hormone receptor-positive disease, the hazard ratio was 1.86 (95% CI, 1.18 to 2.93) in the expert-derived dataset, compared with estimates that were numerically similar but did cross 1.00 for the LLMs with ratios of 1.66 (95% CI, 0.91 to 3.00) and 1.60 (95% CI, 0.87 to 2.91) in the corresponding LLM-derived datasets. 
Cochran Q heterogeneity testing did not identify significant differences in these effect estimates (Supplementary Table S5).\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv id=\u0022sec-17\u0022 class=\u0022subsection\u0022\u003E\u003Ch3\u003EExternal Validation in Young Breast Cancer Patients\u003C\/h3\u003E\u003Cp id=\u0022p-53\u0022\u003EIn an external cohort of 97 young patients with hormone receptor\u2013positive invasive breast cancer diagnosed before pregnancy, expert manual abstraction identified 11 recurrences, compared with 13 and 13 identified by the two leading LLMs. One discordant case was an expert error; the other was an LLM error. The LLM error was on the smallest chart in the cohort\u2014there were no Stanford notes within 7 years of the documented recurrence event and it could only be identified in outside hospital notes that were not in the research warehouse for data ingestion. Receipt of adjuvant endocrine therapy had an F1 score of 0.99 and 0.96 for the two LLMs.\u003C\/p\u003E\u003C\/div\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-18\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EDiscussion\u003C\/h2\u003E\u003Cp id=\u0022p-54\u0022\u003EIn this retrospective study of 100 patients with complex breast cancer histories, a pipeline using off-the-shelf general-purpose LLMs abstracted clinical variables from the medical record with high concordance with expert oncologists. Concordance was highest for variables anchored to pathology, such as estrogen receptor status, and lowest for variables requiring clinical reasoning, such as why a treatment was stopped. For abstracting the anti-cancer treatments, the best-performing model approached inter-oncologist variability. However, there was a clear difference in how the oncologists and LLMs reconstructed therapy lines. 
Despite differences at the individual patient level, cohort level survival and hazard ratio estimates were similar when fully LLM-derived datasets were compared to expert-derived datasets.\u003C\/p\u003E\u003Cp id=\u0022p-55\u0022\u003EManual chart abstraction is a major bottleneck in clinical research. Because we write notes in unstructured text, answering many of the clinically meaningful questions is impractical because creating the analytic dataset is too labor-intensive.\u003Csup\u003E\u003Ca id=\u0022xref-ref-5-3\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-5\u0022\u003E5\u003C\/a\u003E\u003C\/sup\u003E We have high uncertainty across many clinical domains even when, in principle, the information needed to answer these questions exists in the medical record. This is especially true for rare and complex diseases, settings with heterogeneous practice patterns, areas in which unreplicated retrospective studies dominate clinical decision-making, and domains with less mature disease registries than cancer. A practical implication of our approach is that it would make conducting multi-institutional cohort studies much easier: institutions can share a validated common abstraction pipeline while keeping patient-level data local.\u003Csup\u003E\u003Ca id=\u0022xref-ref-13-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-13\u0022\u003E13\u003C\/a\u003E\u003C\/sup\u003E Doing this would allow consortiums to build large harmonized cohorts to address a broad range of clinically important questions.\u003C\/p\u003E\u003Cp id=\u0022p-56\u0022\u003EOur results highlight challenges that extend beyond LLMs to any research in which chart review is a central component. Sparse documentation remains a major barrier, particularly in fragmented health systems such as the United States. In health systems with more centralized longitudinal records, we would expect the LLM-pipeline approach to be powerful. 
As an example, the lack of high-quality death records in our analysis shows how a lack of data integration, and the downstream analytic assumptions, shift results by clinically meaningful amounts. Variables, syndromes, and diseases with ambiguous clinical definitions remain difficult to abstract and to study. Poorly designed abstraction frameworks, whether given to an LLM or a human abstractor, will generate poor datasets.\u003Csup\u003E\u003Ca id=\u0022xref-ref-27-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-27\u0022\u003E27\u003C\/a\u003E\u003C\/sup\u003E\u003C\/p\u003E\u003Cp id=\u0022p-57\u0022\u003EAs LLM-based abstraction becomes more common, whether through abstractors copying and pasting into chatbots or through validated pipelines, it will be critical to establish norms for study design, transparent definitions, statistical rigor, and benchmarking against domain experts.\u003Csup\u003E\u003Ca id=\u0022xref-ref-28-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-28\u0022\u003E28\u003C\/a\u003E\u003C\/sup\u003E Most retrospective studies are fundamentally correlative and, on their own, do not support causal inference.\u003Csup\u003E\u003Ca id=\u0022xref-ref-29-1\u0022 class=\u0022xref-bibr\u0022 href=\u0022#ref-29\u0022\u003E29\u003C\/a\u003E\u003C\/sup\u003E Scaling abstraction will not get us closer to the truth without corresponding scientific rigor.\u003C\/p\u003E\u003Cp id=\u0022p-58\u0022\u003EThis study has limitations: it was conducted in a single healthcare system and focused on a single disease. Effective abstraction was contingent on the relevant data being present in the record. Errors could be because of a lack of data, badly designed retrievers, badly designed prompts, or LLM reasoning errors. 
There remains a clear gap between experts and LLMs on the most complex abstraction tasks, although we expect this gap to narrow as the LLMs improve over time (Supplementary Figure S1).\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-19\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EConclusion\u003C\/h2\u003E\u003Cp id=\u0022p-59\u0022\u003EOff-the-shelf general-purpose LLMs in a fixed retrieval pipeline can abstract clinically meaningful variables from complex longitudinal oncology records. Performance was strongest for variables anchored to pathology and lower for ones that required clinical interpretation. Although a gap remained at the individual-patient level, survival and hazard ratio estimates at the cohort level were preserved. These findings suggest that LLM-based abstraction could enable the creation of large research-grade retrospective datasets that were previously impractical to assemble, thereby supporting a broad range of clinical questions. Realizing this potential will require carefully designed abstraction tasks, validated outputs, and cautious interpretation of results.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section data-availability\u0022 id=\u0022sec-21\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EData Availability\u003C\/h2\u003E\u003Cp id=\u0022p-60\u0022\u003EThe analytic code and core abstraction pipeline will be made publicly available on GitHub upon publication.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-22\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EPrior Presentations\u003C\/h2\u003E\u003Cp id=\u0022p-61\u0022\u003EThis work was presented as a poster at the American Society of Clinical Oncology Annual Meeting 2025 and the San Antonio Breast Cancer Symposium 2025.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-23\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EFunding\u003C\/h2\u003E\u003Cp id=\u0022p-62\u0022\u003EThis work was 
supported by the Stanford Center for Digital Health.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-24\u0022\u003E\u003Ch2 class=\u0022\u0022\u003ECompeting Interests \/ Conflicts of Interest\u003C\/h2\u003E\u003Cp id=\u0022p-63\u0022\u003EJCD: Stock Ownership: Johnson \u0026amp; Johnson, Merck. JLC: research funding to her institution from Effector Therapeutics and Novartis.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section\u0022 id=\u0022sec-25\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EData and Code Availability\u003C\/h2\u003E\u003Cp id=\u0022p-65\u0022\u003EThe analytic code and core abstraction pipeline will be made publicly available upon publication. Please contact \u003Cspan class=\u0022em-link\u0022\u003E\u003Cspan class=\u0022em-addr\u0022\u003Ejcdicker{at}stanford.edu\u003C\/span\u003E\u003C\/span\u003E for collaborations and early access to the pipeline.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section ack\u0022 id=\u0022ack-1\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EAcknowledgements\u003C\/h2\u003E\u003Cp id=\u0022p-64\u0022\u003EWe would like to thank our research coordinators Jessica Orford, Sonia Rios-Ventura, and Rozelle Laquindanum.\u003C\/p\u003E\u003C\/div\u003E\u003Cdiv class=\u0022section ref-list\u0022 id=\u0022ref-list-1\u0022\u003E\u003Ch2 class=\u0022\u0022\u003EReferences\u003C\/h2\u003E\u003Col class=\u0022cit-list ref-use-labels\u0022\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E1.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-1-1\u0022 title=\u0022View reference 1. 
in text\u0022 id=\u0022ref-1\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.1\u0022 data-doi=\u002210.2196\/18143\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EA\u2019Mar\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ET\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBeatty\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJD\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFedorenko\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EC\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EIncorporating Breast Cancer Recurrence Events Into Population-Based Cancer Registries Using Medical Claims: Cohort Study\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJMIR Cancer\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003EAug\u003C\/span\u003E \u003Cspan class=\u0022cit-day\u0022\u003E17\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2020\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E6\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E2\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003Ee18143\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.2196\/18143\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJMIR%2BCancer%26rft.volume%253D6%26rft.spage%253D18143e%26rft_id%253Dinfo%253Adoi%252F10.2196%252F18143%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.2196\/18143\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E2.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-2-1\u0022 title=\u0022View reference 2. 
in text\u0022 id=\u0022ref-2\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.2\u0022 data-doi=\u002210.1200\/cci-25-00143\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECao\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJohnson\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EKL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFumagalli\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EIA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EIntegrating a Shareable Artificial Intelligence Model Into Clinical Research for Cancer Recurrence in Patients With Breast and Colorectal Cancer\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJCO Clin Cancer Inform\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003ENov\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E9\u003C\/span\u003E:\u003Cspan class=\u0022cit-fpage\u0022\u003Ee2500143\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1200\/cci-25-00143\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJCO%2BClin%2BCancer%2BInform%26rft.volume%253D9%26rft.spage%253D2500143e%26rft_id%253Dinfo%253Adoi%252F10.1200%252Fcci-25-00143%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1200\/cci-25-00143\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E3.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-3-1\u0022 title=\u0022View reference 3. 
in text\u0022 id=\u0022ref-3\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.3\u0022 data-doi=\u002210.1093\/jnci\/djaf353\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJourquin\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EDickerson\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJC\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMarks\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EEG\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003ESusan G. Komen\u2019s ShareForCures: a patient-engaged, nationwide breast cancer research registry\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJNCI: Journal of the National Cancer Institute\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1093\/jnci\/djaf353\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJNCI%253A%2BJournal%2Bof%2Bthe%2BNational%2BCancer%2BInstitute%26rft_id%253Dinfo%253Adoi%252F10.1093%252Fjnci%252Fdjaf353%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1093\/jnci\/djaf353\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E4.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-4-1\u0022 title=\u0022View reference 4. 
in text\u0022 id=\u0022ref-4\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.4\u0022 data-doi=\u002210.1200\/op-24-00788\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ERiaz\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EF\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EVaughn\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EZhu\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EH\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EInpatient Immunotherapy Outcomes Study: A Multicenter Retrospective Analysis\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJCO Oncology Practice\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E21\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E8\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E1165\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E1173\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1200\/op-24-00788\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJCO%2BOncology%2BPractice%26rft.volume%253D21%26rft.spage%253D1165%26rft_id%253Dinfo%253Adoi%252F10.1200%252Fop-24-00788%26rft_id%253Dinfo%253Apmid%252F39937997%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1200\/op-24-00788\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=39937997\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E5.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-5-1\u0022 
title=\u0022View reference 5. in text\u0022 id=\u0022ref-5\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.5\u0022 data-doi=\u002210.1093\/jnci\/djv134\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EWarren\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EYabroff\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EKR\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EChallenges and opportunities in measuring cancer recurrence in the United States\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJ Natl Cancer Inst\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-month\u0022\u003EAug\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2015\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E107\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E8\u003C\/span\u003E)\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1093\/jnci\/djv134\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJ%2BNatl%2BCancer%2BInst%26rft_id%253Dinfo%253Adoi%252F10.1093%252Fjnci%252Fdjv134%26rft_id%253Dinfo%253Apmid%252F25971299%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl 
cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1093\/jnci\/djv134\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=25971299\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E6.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-6-1\u0022 title=\u0022View reference 6. in text\u0022 id=\u0022ref-6\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.6\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003ENIH\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EBreast Cancer Recent Trends in SEER Age-Adjusted Incidence Rates, 2000-2022\u003C\/abbr\u003E. Accessed \u003Cspan class=\u0022cit-date-in-citation\u0022\u003E7\/29\/25\u003C\/span\u003E, \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E. 
\u003Ca href=\u0022https:\/\/seer.cancer.gov\/statistics-network\/explorer\/application.html?site=55\u0026amp;data_type=1\u0026amp;graph_type=2\u0026amp;compareBy=sex\u0026amp;chk_sex_3=3\u0026amp;chk_sex_2=2\u0026amp;rate_type=2\u0026amp;race=1\u0026amp;age_range=1\u0026amp;stage=101\u0026amp;advopt_precision=1\u0026amp;advopt_show_ci=on\u0026amp;hdn_view=0\u0026amp;advopt_show_apc=on\u0026amp;advopt_display=2#resultsRegion0\u0022\u003Ehttps:\/\/seer.cancer.gov\/statistics-network\/explorer\/application.html?site=55\u0026amp;data_type=1\u0026amp;graph_type=2\u0026amp;compareBy=sex\u0026amp;chk_sex_3=3\u0026amp;chk_sex_2=2\u0026amp;rate_type=2\u0026amp;race=1\u0026amp;age_range=1\u0026amp;stage=101\u0026amp;advopt_precision=1\u0026amp;advopt_show_ci=on\u0026amp;hdn_view=0\u0026amp;advopt_show_apc=on\u0026amp;advopt_display=2#resultsRegion0\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E7.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-7-1\u0022 title=\u0022View reference 7. 
in text\u0022 id=\u0022ref-7\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.7\u0022 data-doi=\u002210.1093\/jnci\/djaa050\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EIzci\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EH\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ETambuyzer\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ET\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ETuand\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EK\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EA Systematic Review of Estimating Breast Cancer Recurrence at the Population Level With Administrative Data\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJNCI: Journal of the National Cancer Institute\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2020\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E112\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E10\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E979\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E988\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1093\/jnci\/djaa050\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJNCI%253A%2BJournal%2Bof%2Bthe%2BNational%2BCancer%2BInstitute%26rft.volume%253D112%26rft.spage%253D979%26rft_id%253Dinfo%253Adoi%252F10.1093%252Fjnci%252Fdjaa050%26rft_id%253Dinfo%253Apmid%252F32259259%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1093\/jnci\/djaa050\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=32259259\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E8.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 
href=\u0022#xref-ref-8-1\u0022 title=\u0022View reference 8. in text\u0022 id=\u0022ref-8\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.8\u0022 data-doi=\u002210.1158\/1055-9965.EPI-16-0889\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMariotto\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EAB\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EEtzioni\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ER\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHurlbert\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPenberthy\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMayer\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EEstimation of the Number of Women Living with Metastatic Breast Cancer in the United States\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ECancer Epidemiol Biomarkers Prev\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003EJun\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2017\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E26\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E6\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E809\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E815\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1158\/1055-9965.Epi-16-0889\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DCancer%2BEpidemiol%2BBiomarkers%2BPrev%26rft_id%253Dinfo%253Adoi%252F10.1158%252F1055-9965.EPI-16-0889%26rft_id%253Dinfo%253Apmid%252F28522448%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/ijlink\/YTozOntzOjQ6InBhdGgiO3M6MTQ6Ii9sb29rdXAvaWpsaW5rIjtzOjU6InF1ZXJ5IjthOjQ6e3M6ODoibGlua1R5cGUiO3M6NDoiQUJTVCI7czoxMToiam91cm5hbENvZGUiO3M6NDoiY2VicCI7czo1OiJyZXNpZCI7czo4OiIyNi82LzgwOSI7czo0OiJhdG9tIjtzOjUwOiIvbWVkcnhpdi9lYXJseS8yMDI2LzAzLzI1LzIwMjYuMDMuMjMuMjYzNDkwMTIuYXRvbSI7fXM6ODoiZnJhZ21lbnQiO3M6MDoiIjt9\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-ijlink\u0022\u003E\u003Cspan\u003E\u003Cspan class=\u0022cit-reflinks-abstract\u0022\u003EAbstract\u003C\/span\u003E\u003Cspan class=\u0022cit-sep cit-reflinks-variant-name-sep\u0022\u003E\/\u003C\/span\u003E\u003Cspan class=\u0022cit-reflinks-full-text\u0022\u003E\u003Cspan 
class=\u0022free-full-text\u0022\u003EFREE \u003C\/span\u003EFull Text\u003C\/span\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E9.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-9-1\u0022 title=\u0022View reference 9. in text\u0022 id=\u0022ref-9\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.9\u0022 data-doi=\u002210.1200\/JCO.2013.52.0858\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFehrenbacher\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECapra\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EAM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EQuesenberry\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ECP\u003C\/span\u003E,   \u003Cspan class=\u0022cit-name-suffix\u0022\u003EJr.\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFulton\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ER\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EShiraz\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EP\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHabel\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ELA\u003C\/span\u003E\u003C\/span\u003E. 
\u003Cspan class=\u0022cit-article-title\u0022\u003EDistant invasive breast cancer recurrence risk in human epidermal growth factor receptor 2-positive T1a and T1b node-negative localized breast cancer diagnosed from 2000 to 2006: a cohort from an integrated health care delivery system\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJ Clin Oncol\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-month\u0022\u003EJul\u003C\/span\u003E \u003Cspan class=\u0022cit-day\u0022\u003E10\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2014\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E32\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E20\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E2151\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E8\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1200\/jco.2013.52.0858\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJ%2BClin%2BOncol%26rft_id%253Dinfo%253Adoi%252F10.1200%252FJCO.2013.52.0858%26rft_id%253Dinfo%253Apmid%252F24888815%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca 
href=\u0022\/lookup\/ijlink\/YTozOntzOjQ6InBhdGgiO3M6MTQ6Ii9sb29rdXAvaWpsaW5rIjtzOjU6InF1ZXJ5IjthOjQ6e3M6ODoibGlua1R5cGUiO3M6NDoiQUJTVCI7czoxMToiam91cm5hbENvZGUiO3M6MzoiamNvIjtzOjU6InJlc2lkIjtzOjEwOiIzMi8yMC8yMTUxIjtzOjQ6ImF0b20iO3M6NTA6Ii9tZWRyeGl2L2Vhcmx5LzIwMjYvMDMvMjUvMjAyNi4wMy4yMy4yNjM0OTAxMi5hdG9tIjt9czo4OiJmcmFnbWVudCI7czowOiIiO30=\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-ijlink\u0022\u003E\u003Cspan\u003E\u003Cspan class=\u0022cit-reflinks-abstract\u0022\u003EAbstract\u003C\/span\u003E\u003Cspan class=\u0022cit-sep cit-reflinks-variant-name-sep\u0022\u003E\/\u003C\/span\u003E\u003Cspan class=\u0022cit-reflinks-full-text\u0022\u003E\u003Cspan class=\u0022free-full-text\u0022\u003EFREE \u003C\/span\u003EFull Text\u003C\/span\u003E\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E10.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-10-1\u0022 title=\u0022View reference 10. 
in text\u0022 id=\u0022ref-10\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.10\u0022 data-doi=\u002210.1001\/jamaoncol.2023.1891\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ESun\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBleiberg\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EB\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHwang\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EWT\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EAssociation Between Duration of Immunotherapy and Overall Survival in Advanced Non-Small Cell Lung Cancer\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJAMA Oncol\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003EAug\u003C\/span\u003E \u003Cspan class=\u0022cit-day\u0022\u003E1\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2023\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E9\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E8\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E1075\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E1082\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1001\/jamaoncol.2023.1891\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJAMA%2BOncol%26rft.volume%253D9%26rft.spage%253D1075%26rft_id%253Dinfo%253Adoi%252F10.1001%252Fjamaoncol.2023.1891%26rft_id%253Dinfo%253Apmid%252F37270700%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1001\/jamaoncol.2023.1891\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=37270700\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan 
class=\u0022ref-label\u0022\u003E11.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-11-1\u0022 title=\u0022View reference 11. in text\u0022 id=\u0022ref-11\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.11\u0022 data-doi=\u002210.1038\/s41746-024-01274-7\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EGupta\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBasu\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ENievas\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EPRISM: Patient Records Interpretation for Semantic clinical trial Matching system using large language models\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003Enpj Digital Medicine\u003C\/abbr\u003E. 
2024\/10\/28 \u003Cspan class=\u0022cit-pub-date\u0022\u003E2024\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E7\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E305\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1038\/s41746-024-01274-7\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DPRISM%253A%2BPatient%2BRecords%2BInterpretation%2Bfor%2BSemantic%2Bclinical%2Btrial%2BMatching%2Bsystem%2Busing%2Blarge%2Blanguage%2Bmodels.%2Bnpj%2BDigital%2BMedicine%26rft.volume%253D7%26rft.spage%253D305%26rft_id%253Dinfo%253Adoi%252F10.1038%252Fs41746-024-01274-7%26rft_id%253Dinfo%253Apmid%252F39468259%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1038\/s41746-024-01274-7\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=39468259\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan 
class=\u0022ref-label\u0022\u003E12.\u003C\/span\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal no-rev-xref\u0022 id=\u0022cit-2026.03.23.26349012v1.12\u0022 data-doi=\u002210.1038\/s41746-025-01780-2\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EZhu\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELin\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EH\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJiang\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003ELarge language model trained on clinical oncology data predicts cancer progression\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003Enpj Digital Medicine\u003C\/abbr\u003E. 
2025\/07\/02 \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E8\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E397\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1038\/s41746-025-01780-2\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253Dnpj%2BDigital%2BMedicine%26rft.volume%253D8%26rft.spage%253D397%26rft_id%253Dinfo%253Adoi%252F10.1038%252Fs41746-025-01780-2%26rft_id%253Dinfo%253Apmid%252F40604229%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1038\/s41746-025-01780-2\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=40604229\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E13.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-13-1\u0022 title=\u0022View reference 13. 
in text\u0022 id=\u0022ref-13\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.13\u0022 data-doi=\u002210.1038\/s41586-024-08167-5\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJee\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EFong\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EC\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPichotta\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EK\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EAutomated real-world data integration improves cancer outcome prediction\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ENature\u003C\/abbr\u003E. 
2024\/12\/01 \u003Cspan class=\u0022cit-pub-date\u0022\u003E2024\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E636\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E8043\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E728\u003C\/span\u003E-\u003Cspan class=\u0022cit-lpage\u0022\u003E736\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1038\/s41586-024-08167-5\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DNature%26rft.volume%253D636%26rft.spage%253D728%26rft_id%253Dinfo%253Adoi%252F10.1038%252Fs41586-024-08167-5%26rft_id%253Dinfo%253Apmid%252F39506116%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1038\/s41586-024-08167-5\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=39506116\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E14.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-14-1\u0022 
title=\u0022View reference 14. in text\u0022 id=\u0022ref-14\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.14\u0022 data-doi=\u002210.1038\/s41746-025-02009-y\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELuo\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EI\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EGraber-Naidich\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EZhang\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003ELeveraging large language models to extract smoking history from clinical notes for lung cancer surveillance\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003Enpj Digital Medicine\u003C\/abbr\u003E. 
2025\/11\/28 \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E8\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E731\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1038\/s41746-025-02009-y\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253Dnpj%2BDigital%2BMedicine%26rft.volume%253D8%26rft.spage%253D731%26rft_id%253Dinfo%253Adoi%252F10.1038%252Fs41746-025-02009-y%26rft_id%253Dinfo%253Apmid%252F41315854%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1038\/s41746-025-02009-y\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=41315854\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E15.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-15-1\u0022 title=\u0022View reference 15. 
in text\u0022 id=\u0022ref-15\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2026.03.23.26349012v1.15\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EGliadkovskaya\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA.\u003C\/span\u003E\u003C\/span\u003E \u003Cspan class=\u0022cit-source\u0022\u003EOpenAI rolls out ChatGPT for Healthcare, a gen AI workspace for hospitals and clinics\u003C\/span\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2026\u003C\/span\u003E. \u003Ca href=\u0022https:\/\/www.fiercehealthcare.com\/health-tech\/openai-rolls-out-chatgpt-healthcare-genai-workspace-enterprises\u0022\u003Ehttps:\/\/www.fiercehealthcare.com\/health-tech\/openai-rolls-out-chatgpt-healthcare-genai-workspace-enterprises\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E16.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-16-1\u0022 title=\u0022View reference 16. 
in text\u0022 id=\u0022ref-16\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.16\u0022 data-doi=\u002210.1371\/journal.pone.0264138\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMilbury\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ECA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECreeden\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EYip\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EWK\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EClinical and analytical validation of FoundationOne\u00aeCDx, a comprehensive genomic profiling assay for solid tumors\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EPLoS One\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2022\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E17\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E3\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003Ee0264138\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1371\/journal.pone.0264138\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DPLoS%2BOne%26rft.volume%253D17%26rft.spage%253De0264138%26rft_id%253Dinfo%253Adoi%252F10.1371%252Fjournal.pone.0264138%26rft_id%253Dinfo%253Apmid%252F35294956%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1371\/journal.pone.0264138\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=35294956\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E17.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-17-1\u0022 title=\u0022View reference 17. 
in text\u0022 id=\u0022ref-17\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2026.03.23.26349012v1.17\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003EEpic Systems Corporation.\u003C\/span\u003E \u003Cspan class=\u0022cit-source\u0022\u003ECare Everywhere. Epic Systems Corporation\u003C\/span\u003E. Updated \u003Cspan class=\u0022cit-pub-date\u0022\u003E2026\u003C\/span\u003E. \u003Ca href=\u0022https:\/\/www.epic.com\/careeverywhere\/?search=\u0026amp;country=\u0026amp;usstate=\u0022\u003Ehttps:\/\/www.epic.com\/careeverywhere\/?search=\u0026amp;country=\u0026amp;usstate=\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E18.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-18-1\u0022 title=\u0022View reference 18. in text\u0022 id=\u0022ref-18\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-web\u0022 id=\u0022cit-2026.03.23.26349012v1.18\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth cit-collab\u0022\u003ERepository SRD\u003C\/span\u003E. \u003Cspan class=\u0022cit-source\u0022\u003EData types in STARR\u003C\/span\u003E. \u003Ca href=\u0022https:\/\/starr.stanford.edu\/data-types\u0022\u003Ehttps:\/\/starr.stanford.edu\/data-types\u003C\/a\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E19.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-19-1\u0022 title=\u0022View reference 19. 
in text\u0022 id=\u0022ref-19\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.19\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ESounack\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ET\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EDavis\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EDurieux\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EB\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EBioClinical ModernBERT: A State-of-the-Art Long-Context Encoder for Biomedical and Clinical NLP\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EPreprint. arXiv\u003C\/abbr\u003E. 2025\/06\/12 \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E.\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E20.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-20-1\u0022 title=\u0022View reference 20. 
in text\u0022 id=\u0022ref-20\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.20\u0022 data-doi=\u002210.1561\/1500000019\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ERobertson\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ES\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EZaragoza\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EH\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EThe Probabilistic Relevance Framework: BM25 and Beyond\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EFoundations and Trends in Information Retrieval\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2009\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E3\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E4\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E333\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E389\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1561\/1500000019\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca 
href=\u0022{openurl}?query=rft.jtitle%253DFoundations%2Band%2BTrends%2Bin%2BInformation%2BRetrieval%26rft.volume%253D3%26rft.spage%253D333%26rft_id%253Dinfo%253Adoi%252F10.1561%252F1500000019%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1561\/1500000019\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E21.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-21-1\u0022 title=\u0022View reference 21. in text\u0022 id=\u0022ref-21\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.21\u0022 data-doi=\u002210.48550\/arXiv.1603.09320\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMalkov\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EYA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EYashunin\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EDA\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EEfficient and robust approximate nearest neighbor search using Hierarchical Navigable Small World graphs\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EarXiv\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E2018\u003C\/span\u003E;\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.48550\/arXiv.1603.09320\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DarXiv%26rft_id%253Dinfo%253Adoi%252F10.48550%252FarXiv.1603.09320%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.48550\/arXiv.1603.09320\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E22.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-22-1\u0022 title=\u0022View reference 22. 
in text\u0022 id=\u0022ref-22\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.22\u0022 data-doi=\u002210.21203\/rs.3.rs-5095287\/v1\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ENg\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EMY\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHelzer\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPfeffer\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EMA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ESeto\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ET\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EHernandez-Boussard\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ET\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EDevelopment of Secure Infrastructure for Advancing Generative AI Research in Healthcare at an Academic Medical Center\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003ERes Sq\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003ESep\u003C\/span\u003E \u003Cspan class=\u0022cit-day\u0022\u003E24\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2024\u003C\/span\u003E;\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.21203\/rs.3.rs-5095287\/v1\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DRes%2BSq%26rft_id%253Dinfo%253Adoi%252F10.21203%252Frs.3.rs-5095287%252Fv1%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.21203\/rs.3.rs-5095287\/v1\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E23.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-23-1\u0022 title=\u0022View reference 23. in text\u0022 id=\u0022ref-23\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.23\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EJaccard\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EP\u003C\/span\u003E\u003C\/span\u003E. 
\u003Cspan class=\u0022cit-article-title\u0022\u003E\u00c9tude comparative de la distribution florale dans une portion des Alpes et des Jura\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EBulletin de la Soci\u00e9t\u00e9 Vaudoise des Sciences Naturelles\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E1901\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E7\u003C\/span\u003E:\u003Cspan class=\u0022cit-fpage\u0022\u003E547\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E579\u003C\/span\u003E.\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DBulletin%2Bde%2Bla%2BSoci%25E9t%25E9%2BVaudoise%2Bdes%2BSciences%2BNaturelles%26rft.volume%253D7%26rft.spage%253D547%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E24.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-24-1\u0022 title=\u0022View reference 24. 
in text\u0022 id=\u0022ref-24\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.24\u0022 data-doi=\u002210.2307\/2281868\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EKaplan\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EEL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMeier\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EP\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003ENonparametric Estimation from Incomplete Observations\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJournal of the American Statistical Association\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E1958\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E53\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E282\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E457\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E481\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.2307\/2281868\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca 
href=\u0022{openurl}?query=rft.jtitle%253DJournal%2Bof%2Bthe%2BAmerican%2BStatistical%2BAssociation%26rft.volume%253D53%26rft.spage%253D457%26rft_id%253Dinfo%253Adoi%252F10.2307%252F2281868%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.2307\/2281868\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=A1958WX09300012\u0026amp;link_type=ISI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-newisilink cit-ref-sprinkles-webofscience\u0022\u003E\u003Cspan\u003EWeb of Science\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E25.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-25-1\u0022 title=\u0022View reference 25. in text\u0022 id=\u0022ref-25\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.25\u0022 data-doi=\u002210.2307\/2289144\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EEfron\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EB\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003EBetter Bootstrap Confidence Intervals\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJournal of the American Statistical Association\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-pub-date\u0022\u003E1987\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E82\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E397\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E171\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E185\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.2307\/2289144\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJournal%2Bof%2Bthe%2BAmerican%2BStatistical%2BAssociation%26rft.volume%253D82%26rft.spage%253D171%26rft_id%253Dinfo%253Adoi%252F10.2307%252F2289144%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.2307\/2289144\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=A1987G462600027\u0026amp;link_type=ISI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-newisilink cit-ref-sprinkles-webofscience\u0022\u003E\u003Cspan\u003EWeb of Science\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E26.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-26-1\u0022 title=\u0022View reference 26. 
in text\u0022 id=\u0022ref-26\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.26\u0022 data-doi=\u002210.1001\/jamaoncol.2024.6868\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ERansohoff\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJD\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ELewinsohn\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ERM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EDickerson\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EEndocrine Therapy Interruption, Resumption, and Outcomes Associated With Pregnancy After Breast Cancer\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJAMA Oncol\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003EApr\u003C\/span\u003E \u003Cspan class=\u0022cit-day\u0022\u003E1\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E11\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E4\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E423\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E426\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1001\/jamaoncol.2024.6868\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DJAMA%2BOncol%26rft.volume%253D11%26rft.spage%253D423%26rft_id%253Dinfo%253Adoi%252F10.1001%252Fjamaoncol.2024.6868%26rft_id%253Dinfo%253Apmid%252F39946107%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1001\/jamaoncol.2024.6868\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=39946107\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan 
class=\u0022ref-label\u0022\u003E27.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-27-1\u0022 title=\u0022View reference 27. in text\u0022 id=\u0022ref-27\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.27\u0022 data-doi=\u002210.1186\/s12874-024-02440-x\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPfaffenlehner\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBehrens\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EM\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EZ\u00f6ller\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ED\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EMethodological challenges using routine clinical care data for real-world evidence: a rapid review utilizing a systematic literature search and focus group discussion\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EBMC Med Res Methodol\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003EJan\u003C\/span\u003E \u003Cspan class=\u0022cit-day\u0022\u003E14\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2025\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E25\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E1\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E8\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1186\/s12874-024-02440-x\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DBMC%2BMed%2BRes%2BMethodol%26rft_id%253Dinfo%253Adoi%252F10.1186%252Fs12874-024-02440-x%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1186\/s12874-024-02440-x\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E28.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-28-1\u0022 title=\u0022View reference 28. 
in text\u0022 id=\u0022ref-28\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.28\u0022 data-doi=\u002210.1016\/j.esmorw.2023.10.001\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003ECastelo-Branco\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EL\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EPellat\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EA\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EMartins-Branco\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003ED\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-etal\u0022\u003Eet al.\u003C\/span\u003E \u003Cspan class=\u0022cit-article-title\u0022\u003EESMO Guidance for Reporting Oncology real-World evidence (GROW)\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EESMO Real World Data Digit Oncol\u003C\/abbr\u003E. 
\u003Cspan class=\u0022cit-month\u0022\u003ENov\u003C\/span\u003E \u003Cspan class=\u0022cit-pub-date\u0022\u003E2023\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E1\u003C\/span\u003E:\u003Cspan class=\u0022cit-fpage\u0022\u003E100003\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1016\/j.esmorw.2023.10.001\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca href=\u0022{openurl}?query=rft.jtitle%253DESMO%2BReal%2BWorld%2BData%2BDigit%2BOncol%26rft.volume%253D1%26rft.spage%253D100003%26rft_id%253Dinfo%253Adoi%252F10.1016%252Fj.esmorw.2023.10.001%26rft_id%253Dinfo%253Apmid%252F41647770%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1016\/j.esmorw.2023.10.001\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=41647770\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003Cli\u003E\u003Cspan class=\u0022ref-label\u0022\u003E29.\u003C\/span\u003E\u003Ca class=\u0022rev-xref-ref\u0022 href=\u0022#xref-ref-29-1\u0022 title=\u0022View reference 29. 
in text\u0022 id=\u0022ref-29\u0022\u003E\u21b5\u003C\/a\u003E\u003Cdiv class=\u0022cit ref-cit ref-journal\u0022 id=\u0022cit-2026.03.23.26349012v1.29\u0022 data-doi=\u002210.1001\/jama.2024.7741\u0022\u003E\u003Cdiv class=\u0022cit-metadata\u0022\u003E\u003Ccite\u003E\u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EDahabreh\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EIJ\u003C\/span\u003E\u003C\/span\u003E, \u003Cspan class=\u0022cit-auth\u0022\u003E\u003Cspan class=\u0022cit-name-surname\u0022\u003EBibbins-Domingo\u003C\/span\u003E  \u003Cspan class=\u0022cit-name-given-names\u0022\u003EK\u003C\/span\u003E\u003C\/span\u003E. \u003Cspan class=\u0022cit-article-title\u0022\u003ECausal Inference About the Effects of Interventions From Observational Studies in Medical Journals\u003C\/span\u003E. \u003Cabbr class=\u0022cit-jnl-abbrev\u0022\u003EJAMA\u003C\/abbr\u003E. \u003Cspan class=\u0022cit-pub-date\u0022\u003E2024\u003C\/span\u003E;\u003Cspan class=\u0022cit-vol\u0022\u003E331\u003C\/span\u003E(\u003Cspan class=\u0022cit-issue\u0022\u003E21\u003C\/span\u003E):\u003Cspan class=\u0022cit-fpage\u0022\u003E1845\u003C\/span\u003E\u2013\u003Cspan class=\u0022cit-lpage\u0022\u003E1853\u003C\/span\u003E.\u003Cspan class=\u0022cit-pub-id-sep cit-pub-id-doi-sep\u0022\u003E \u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id-scheme\u0022\u003Edoi:\u003C\/span\u003E\u003Cspan class=\u0022cit-pub-id cit-pub-id-doi\u0022\u003E10.1001\/jama.2024.7741\u003C\/span\u003E\u003C\/cite\u003E\u003C\/div\u003E\u003Cdiv class=\u0022cit-extra\u0022\u003E\u003Ca 
href=\u0022{openurl}?query=rft.jtitle%253DJAMA%26rft.volume%253D331%26rft.spage%253D1845%26rft_id%253Dinfo%253Adoi%252F10.1001%252Fjama.2024.7741%26rft_id%253Dinfo%253Apmid%252F38722735%26rft.genre%253Darticle%26rft_val_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Ajournal%26ctx_ver%253DZ39.88-2004%26url_ver%253DZ39.88-2004%26url_ctx_fmt%253Dinfo%253Aofi%252Ffmt%253Akev%253Amtx%253Actx\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-openurl cit-ref-sprinkles-open-url\u0022\u003E\u003Cspan\u003EOpenUrl\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=10.1001\/jama.2024.7741\u0026amp;link_type=DOI\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-doi cit-ref-sprinkles-crossref\u0022\u003E\u003Cspan\u003ECrossRef\u003C\/span\u003E\u003C\/a\u003E\u003Ca href=\u0022\/lookup\/external-ref?access_num=38722735\u0026amp;link_type=MED\u0026amp;atom=%2Fmedrxiv%2Fearly%2F2026%2F03%2F25%2F2026.03.23.26349012.atom\u0022 class=\u0022cit-ref-sprinkles cit-ref-sprinkles-medline\u0022\u003E\u003Cspan\u003EPubMed\u003C\/span\u003E\u003C\/a\u003E\u003C\/div\u003E\u003C\/div\u003E\u003C\/li\u003E\u003C\/ol\u003E\u003C\/div\u003E\u003Cspan class=\u0022highwire-journal-article-marker-end\u0022\u003E\u003C\/span\u003E\u003C\/div\u003E\u003Cspan class=\u0022related-urls\u0022\u003E\u003C\/span\u003E\u003C\/div\u003E\u003C\/div\u003E  \u003C\/div\u003E\n\n  \n  \u003C\/div\u003E\n\u003C\/div\u003E\n  \u003C\/div\u003E\n\u003C\/div\u003E\n\u003C\/div\u003E\u003Cscript type=\u0022text\/javascript\u0022 src=\u0022https:\/\/www.medrxiv.org\/sites\/default\/files\/js\/js_zP7WWIfzbyzvaM63L39cNV2juU_1XVH7wduFK9gcMNI.js\u0022\u003E\u003C\/script\u003E\n\u003C\/body\u003E\u003C\/html\u003E"}