{"id":"https://openalex.org/W7154482220","doi":"https://doi.org/10.48550/arxiv.2604.12385","title":"From Myopic Selection to Long-Horizon Awareness: Sequential LLM Routing for Multi-Turn Dialogue","display_name":"From Myopic Selection to Long-Horizon Awareness: Sequential LLM Routing for Multi-Turn Dialogue","publication_year":2026,"publication_date":"2026-04-14","ids":{"openalex":"https://openalex.org/W7154482220","doi":"https://doi.org/10.48550/arxiv.2604.12385"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.12385","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12385","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.12385","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133727370","display_name":"Jiarui Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiarui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133676231","display_name":"Xiangyu Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiangyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133669041","display_name":"Yong Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Yong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133679818","display_name":"Chaoyue Niu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Niu, Chaoyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109578074","display_name":"Hang Zeng","orcid":"https://orcid.org/0009-0009-6841-9872"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Hang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101671433","display_name":"Shaojie Tang","orcid":"https://orcid.org/0000-0003-1323-6939"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Shaojie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133644700","display_name":"Fan Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Fan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121620022","display_name":"Guihai Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Guihai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.5910999774932861,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.5910999774932861,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.2533000111579895,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.026000000536441803,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.7544999718666077},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.723800003528595},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6808000206947327},{"id":"https://openalex.org/keywords/policy-based-routing","display_name":"Policy-based routing","score":0.44859999418258667},{"id":"https://openalex.org/keywords/static-routing","display_name":"Static routing","score":0.42590001225471497},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.41940000653266907},{"id":"https://openalex.org/keywords/adaptive-routing","display_name":"Adaptive routing","score":0.33399999141693115}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.781000018119812},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.7544999718666077},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.723800003528595},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6808000206947327},{"id":"https://openalex.org/C196423136","wikidata":"https://www.wikidata.org/wiki/Q7209671","display_name":"Policy-based routing","level":5,"score":0.44859999418258667},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4307999908924103},{"id":"https://openalex.org/C204948658","wikidata":"https://www.wikidata.org/wiki/Q1119410","display_name":"Static routing","level":4,"score":0.42590001225471497},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.41940000653266907},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3725999891757965},{"id":"https://openalex.org/C24856439","wikidata":"https://www.wikidata.org/wiki/Q352483","display_name":"Adaptive routing","level":5,"score":0.33399999141693115},{"id":"https://openalex.org/C2984173633","wikidata":"https://www.wikidata.org/wiki/Q22725","display_name":"Routing algorithm","level":4,"score":0.3212999999523163},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.32120001316070557},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.3116999864578247},{"id":"https://openalex.org/C2983435990","wikidata":"https://www.wikidata.org/wiki/Q22725","display_name":"Network routing","level":3,"score":0.28189998865127563},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2770000100135803},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2720000147819519},{"id":"https://openalex.org/C76522221","wikidata":"https://www.wikidata.org/wiki/Q5035396","display_name":"Multipath routing","level":5,"score":0.2667999863624573},{"id":"https://openalex.org/C166109690","wikidata":"https://www.wikidata.org/wiki/Q4677422","display_name":"Action selection","level":3,"score":0.2621999979019165}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.12385","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12385","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.12385","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12385","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multi-turn":[0],"dialogue":[1,30,65,107],"is":[2,16],"the":[3],"predominant":[4],"form":[5],"of":[6,113],"interaction":[7,33],"with":[8,75,90,142],"large":[9],"language":[10],"models":[11],"(LLMs).":[12],"While":[13],"LLM":[14,70],"routing":[15,51,84,97,128],"effective":[17],"in":[18,28,130],"single-turn":[19,46],"settings,":[20],"existing":[21,127],"methods":[22],"fail":[23],"to":[24,32,48,63],"maximize":[25],"cumulative":[26,77],"performance":[27],"multi-turn":[29,53,96],"due":[31],"dynamics":[34],"and":[35,72,105,116,126],"delayed":[36],"rewards.":[37,78],"To":[38],"address":[39],"this":[40],"challenge,":[41],"we":[42,56],"move":[43],"from":[44,86],"myopic,":[45],"selection":[47],"long-horizon":[49],"sequential":[50],"for":[52],"dialogue.":[54],"Accordingly,":[55],"propose":[57],"DialRouter,":[58],"which":[59],"first":[60],"performs":[61],"MCTS":[62],"explore":[64],"branches":[66],"induced":[67],"by":[68],"different":[69],"selections":[71],"collect":[73],"trajectories":[74],"high":[76],"DialRouter":[79,121],"then":[80],"learns":[81],"a":[82,136,143],"lightweight":[83],"policy":[85],"search-derived":[87],"data,":[88],"augmented":[89],"retrieval-based":[91],"future":[92],"state":[93],"approximation,":[94],"enabling":[95],"without":[98],"online":[99],"search.":[100],"Experiments":[101],"on":[102],"both":[103,114],"open-domain":[104],"domain-specific":[106],"tasks":[108],"across":[109],"diverse":[110],"candidate":[111],"sets":[112],"open-source":[115],"closed-source":[117],"LLMs":[118,125],"demonstrate":[119],"that":[120],"significantly":[122],"outperforms":[123],"single":[124],"baselines":[129],"task":[131],"success":[132],"rate,":[133],"while":[134],"achieving":[135],"superior":[137],"performance-cost":[138],"trade-off":[139],"when":[140],"combined":[141],"cost-aware":[144],"reward.":[145]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-16T00:00:00"}
