{"id":"https://openalex.org/W7161713361","doi":"https://doi.org/10.48550/arxiv.2605.17792","title":"HydroAgent: Closing the Gap Between Frontier LLMs and Human Experts in Hydrologic Model Calibration via Simulator-Grounded RL","display_name":"HydroAgent: Closing the Gap Between Frontier LLMs and Human Experts in Hydrologic Model Calibration via Simulator-Grounded RL","publication_year":2026,"publication_date":"2026-05-18","ids":{"openalex":"https://openalex.org/W7161713361","doi":"https://doi.org/10.48550/arxiv.2605.17792"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.17792","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17792","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.17792","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136493184","display_name":"Zhi Li","orcid":"https://orcid.org/0009-0001-5749-4000"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058972335","display_name":"Songkun Yan","orcid":"https://orcid.org/0009-0008-3820-104X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Songkun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136478041","display_name":"Jie Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Jie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136460475","display_name":"Mofan Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Mofan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017132290","display_name":"Anjiang Wei","orcid":"https://orcid.org/0000-0003-1654-6027"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Anjiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102178022","display_name":"J.-M. Yoo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoo, Jinwoong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136471520","display_name":"Yang Hong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong, Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11490","display_name":"Hydrological Forecasting Using AI","score":0.2687999904155731,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11490","display_name":"Hydrological Forecasting Using AI","score":0.2687999904155731,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10930","display_name":"Flood Risk Assessment and Management","score":0.2583000063896179,"subfield":{"id":"https://openalex.org/subfields/2306","display_name":"Global and Planetary Change"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10330","display_name":"Hydrology and Watershed Management Studies","score":0.20090000331401825,"subfield":{"id":"https://openalex.org/subfields/2312","display_name":"Water Science and Technology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hydrological-modelling","display_name":"Hydrological modelling","score":0.46880000829696655},{"id":"https://openalex.org/keywords/hydrograph","display_name":"Hydrograph","score":0.4514999985694885},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.4336000084877014},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.3756999969482422},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.3450999855995178},{"id":"https://openalex.org/keywords/water-resources","display_name":"Water resources","score":0.31850001215934753},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.3109000027179718}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6437000036239624},{"id":"https://openalex.org/C126197015","wikidata":"https://www.wikidata.org/wiki/Q1586683","display_name":"Hydrological modelling","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C154936535","wikidata":"https://www.wikidata.org/wiki/Q320062","display_name":"Hydrograph","level":3,"score":0.4514999985694885},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.4336000084877014},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.3756999969482422},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3450999855995178},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.3433000147342682},{"id":"https://openalex.org/C39432304","wikidata":"https://www.wikidata.org/wiki/Q188847","display_name":"Environmental science","level":0,"score":0.3215999901294708},{"id":"https://openalex.org/C153823671","wikidata":"https://www.wikidata.org/wiki/Q1049799","display_name":"Water resources","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.3109000027179718},{"id":"https://openalex.org/C183030095","wikidata":"https://www.wikidata.org/wiki/Q255894","display_name":"Equifinality","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C207319327","wikidata":"https://www.wikidata.org/wiki/Q41453","display_name":"Diatreme","level":4,"score":0.28949999809265137},{"id":"https://openalex.org/C8505890","wikidata":"https://www.wikidata.org/wiki/Q605095","display_name":"Budget constraint","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C76886044","wikidata":"https://www.wikidata.org/wiki/Q2883300","display_name":"Hydrology (agriculture)","level":2,"score":0.2793999910354614},{"id":"https://openalex.org/C150547873","wikidata":"https://www.wikidata.org/wiki/Q947851","display_name":"Watershed","level":2,"score":0.2703999876976013},{"id":"https://openalex.org/C74256435","wikidata":"https://www.wikidata.org/wiki/Q134052","display_name":"Flood myth","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.17792","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17792","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.17792","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17792","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.5524158477783203,"display_name":"Clean water and sanitation","id":"https://metadata.un.org/sdg/6"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Calibrating":[0],"distributed":[1,96],"hydrologic":[2,66,97],"models":[3,141],"is":[4,163,219],"a":[5,41,165,169,194,212,220,252],"critical":[6],"bottleneck":[7],"across":[8,113,131],"operational":[9,94],"water":[10],"resources":[11],"management":[12],"-":[13,81,91,201,239,248],"streamflow":[14],"prediction,":[15],"reservoir":[16],"operation,":[17],"drought":[18],"monitoring,":[19],"infrastructure":[20],"design,":[21],"and":[22,45,68,88,135,147,187,223,232,245],"flood":[23],"forecasting":[24],"all":[25,132],"depend":[26],"on":[27,92,156,182],"it.":[28],"Each":[29],"basin":[30],"demands":[31],"an":[32],"expert":[33,184],"to":[34,124],"translate":[35],"hydrograph":[36],"signatures":[37],"into":[38],"adjustments":[39],"of":[40,236],"high-dimensional":[42],"parameter":[43],"vector,":[44],"the":[46,64,93,101,128,139,144,151,233],"resulting":[47],"workflow":[48],"does":[49],"not":[50,164],"transfer":[51],"between":[52],"watersheds.":[53],"We":[54,75,159,172],"ask:":[55],"can":[56],"frontier":[57,78,230],"large":[58],"language":[59],"model":[60,98,149],"(LLM)":[61],"agents":[62,80,251],"replace":[63],"human":[65],"modeler,":[67],"if":[69],"not,":[70],"what":[71],"would":[72],"it":[73],"take?":[74],"benchmark":[76],"nine":[77],"LLM":[79],"Claude":[82],"Opus":[83],"4.6/4.7,":[84],"Sonnet":[85],"4.6,":[86],"GPT-5/5.4/5.4-pro,":[87],"Gemini":[89],"2.5-pro/3.1-pro/3-flash":[90],"CREST":[95,199],"used":[99],"by":[100],"U.S.":[102],"National":[103],"Weather":[104],"Service":[105],"for":[106,255],"flash-flood":[107],"forecasting.":[108],"Best-of-twenty-rounds":[109],"Nash-Sutcliffe":[110],"Efficiency":[111],"(NSE)":[112],"four":[114],"held-out":[115],"gauges":[116],"spanning":[117],"329-40,792":[118],"km2":[119],"ranges":[120],"from":[121,197],"-0.16":[122],"(GPT-5.4)":[123],"0.75":[125],"(Sonnet":[126],"4.6);":[127],"ceiling":[129],"reproduces":[130],"three":[133],"vendors":[134],"capability":[136],"tiers,":[137],"with":[138,179,204,216],"strongest":[140],"concentrating":[142],"in":[143,257],"0.65-0.75":[145],"band,":[146],"no":[148],"reaches":[150],"human-expert":[152],"reference":[153],"except":[154],"Opus-4.7":[155],"one":[157],"gauge.":[158],"argue":[160],"this":[161],"gap":[162],"parameter-count":[166],"problem":[167],"but":[168],"domain-grounding":[170],"problem.":[171],"then":[173],"propose":[174],"HYDROAGENT,":[175],"fine-tuning":[176,181],"open-weight":[177],"Qwen3-4B":[178],"supervised":[180],"2,576":[183],"calibration":[185],"trajectories":[186],"Group-Relative":[188],"Policy":[189],"Optimization":[190],"using":[191],"NSE":[192],"as":[193],"verifiable":[195],"reward":[196],"online":[198],"simulations":[200],"reinforcement":[202],"learning":[203],"simulation":[205],"feedback":[206],"(RLSF).":[207],"For":[208],"Earth":[209,237],"system":[210],"science,":[211],"small":[213],"domain-tuned":[214],"policy":[215],"simulator-in-the-loop":[217],"RL":[218],"more":[221],"compute-efficient":[222],"physically":[224],"faithful":[225],"path":[226],"than":[227],"scaling":[228],"generic":[229],"models,":[231],"multi-modal":[234],"richness":[235],"data":[238],"remote":[240],"sensing,":[241],"in-situ":[242],"time":[243],"series,":[244],"forecaster":[246],"narrative":[247],"makes":[249],"domain":[250],"leveraged":[253],"direction":[254],"AI":[256],"physical":[258],"science.":[259]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
