{"id":"https://openalex.org/W7140330028","doi":"https://doi.org/10.48550/arxiv.2603.22327","title":"Evaluating AI-based Scientific Knowledge Synthesis with Epidemiological Systematic Reviews","display_name":"Evaluating AI-based Scientific Knowledge Synthesis with Epidemiological Systematic Reviews","publication_year":2026,"publication_date":"2026-03-20","ids":{"openalex":"https://openalex.org/W7140330028","doi":"https://doi.org/10.48550/arxiv.2603.22327"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22327","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22327","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22327","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130567050","display_name":"Shreyansh Padarha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Padarha, Shreyansh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130559103","display_name":"Ryan Othniel Kearns","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kearns, Ryan Othniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011909343","display_name":"Tristan Naidoo","orcid":"https://orcid.org/0000-0001-9970-2421"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naidoo, Tristan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101227006","display_name":"Lingyi Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Lingyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130542457","display_name":"\u0141ukasz Borchmann","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Borchmann, \u0141ukasz","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012595564","display_name":"P. B\u0142aszczyk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"B\u0141aszczyk, Piotr","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130564645","display_name":"Christian Morgenstern","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Morgenstern, Christian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091706473","display_name":"Ruth McCabe","orcid":"https://orcid.org/0000-0002-6368-9103"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McCabe, Ruth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009786456","display_name":"Sangeeta Bhatia","orcid":"https://orcid.org/0000-0001-6525-101X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhatia, Sangeeta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130606591","display_name":"Philip H. Torr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Torr, Philip H.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130604435","display_name":"Jakob Foerster","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Foerster, Jakob","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130629054","display_name":"Scott A. Hale","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hale, Scott A.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049683887","display_name":"Thomas Rawson","orcid":"https://orcid.org/0000-0001-8182-4279"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rawson, Thomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130606388","display_name":"Anne Cori","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cori, Anne","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086142243","display_name":"Elizaveta Semenova","orcid":"https://orcid.org/0000-0002-8271-2575"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Semenova, Elizaveta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5055914149","display_name":"Adam Mahdi","orcid":"https://orcid.org/0000-0002-2329-4457"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mahdi, Adam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.18860000371932983,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.18860000371932983,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.15449999272823334,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.10700000077486038,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/systematic-review","display_name":"Systematic review","score":0.8188999891281128},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5873000025749207},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5055999755859375},{"id":"https://openalex.org/keywords/causal-inference","display_name":"Causal inference","score":0.5016000270843506},{"id":"https://openalex.org/keywords/scientific-literature","display_name":"Scientific literature","score":0.4404999911785126},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.43720000982284546}],"concepts":[{"id":"https://openalex.org/C189708586","wikidata":"https://www.wikidata.org/wiki/Q1504425","display_name":"Systematic review","level":3,"score":0.8188999891281128},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.6090999841690063},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5873000025749207},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5612999796867371},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5055999755859375},{"id":"https://openalex.org/C158600405","wikidata":"https://www.wikidata.org/wiki/Q5054566","display_name":"Causal inference","level":2,"score":0.5016000270843506},{"id":"https://openalex.org/C2781083858","wikidata":"https://www.wikidata.org/wiki/Q17327049","display_name":"Scientific literature","level":2,"score":0.4404999911785126},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.43720000982284546},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.42309999465942383},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.362199991941452},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.35600000619888306},{"id":"https://openalex.org/C100253034","wikidata":"https://www.wikidata.org/wiki/Q196372","display_name":"Systematic error","level":2,"score":0.3547999858856201},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.3384000062942505},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3330000042915344},{"id":"https://openalex.org/C2778571376","wikidata":"https://www.wikidata.org/wiki/Q1355821","display_name":"Frontier","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2784000039100647},{"id":"https://openalex.org/C124056412","wikidata":"https://www.wikidata.org/wiki/Q3320364","display_name":"Scientific evidence","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22327","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22327","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22327","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22327","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6645535230636597,"id":"https://metadata.un.org/sdg/3","display_name":"Good health and well-being"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Systematic":[0],"literature":[1],"reviews":[2],"(SLRs)":[3],"are":[4,152],"a":[5,29,81,119],"demanding":[6],"and":[7,38,69,97],"high-stakes":[8],"form":[9],"of":[10,54,130],"scientific":[11],"knowledge":[12],"synthesis":[13],"that":[14,99,148],"remains":[15],"underspecified":[16],"as":[17,80],"an":[18,34,39,126],"evaluation":[19,31],"setting":[20],"for":[21,157],"large":[22],"language":[23],"models":[24,96,151],"(LLMs).":[25],"We":[26,91],"introduce":[27],"AgentSLR,":[28],"large-scale":[30],"harness":[32,75],"comprising":[33],"SLR":[35],"automation":[36],"workflow":[37],"expert":[40],"annotated":[41],"dataset":[42],"covering":[43],"16,248":[44],"articles,":[45],"designed":[46],"to":[47,138],"test":[48],"LLM":[49],"capabilities":[50],"across":[51,104,141],"the":[52,149],"stages":[53],"SLRs":[55],"in":[56,160],"epidemiology.":[57],"Reference":[58],"annotations":[59],"were":[60],"derived":[61],"from":[62],"peer-reviewed":[63],"studies":[64],"on":[65],"WHO":[66],"priority":[67],"pathogens":[68],"produced":[70],"by":[71,112,136],"domain":[72],"experts.":[73],"The":[74],"evaluates":[76],"each":[77],"review":[78],"stage":[79],"separate":[82],"unit":[83],"with":[84,122],"dedicated":[85],"metrics":[86],"enabling":[87],"targeted":[88],"failure":[89,145],"analysis.":[90],"evaluated":[92,142,150],"five":[93],"frontier":[94],"reasoning":[95],"found":[98],"no":[100,123],"single":[101],"model":[102,124],"dominated":[103],"all":[105],"tasks,":[106],"showing":[107],"sub-task":[108],"specialisation":[109],"often":[110],"hidden":[111],"aggregate":[113],"benchmarks.":[114],"Structured":[115],"data":[116],"extraction":[117],"is":[118],"major":[120],"bottleneck,":[121],"exceeding":[125],"average":[127],"field-level":[128],"F1":[129],"0.67.":[131],"Estimated":[132],"costs":[133],"vary":[134],"substantially,":[135],"up":[137],"96":[139],"times":[140],"models.":[143],"Documented":[144],"modes":[146],"suggest":[147],"not":[153],"yet":[154],"reliable":[155],"enough":[156],"unsupervised":[158],"deployment":[159],"epidemiology,":[161],"where":[162],"findings":[163],"can":[164],"inform":[165],"public":[166],"policy.":[167]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-26T00:00:00"}
