{"id":"https://openalex.org/W7157169782","doi":"https://doi.org/10.48550/arxiv.2604.23623","title":"Tandem: Riding Together with Large and Small Language Models for Efficient Reasoning","display_name":"Tandem: Riding Together with Large and Small Language Models for Efficient Reasoning","publication_year":2026,"publication_date":"2026-04-26","ids":{"openalex":"https://openalex.org/W7157169782","doi":"https://doi.org/10.48550/arxiv.2604.23623"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.23623","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23623","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.23623","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134805743","display_name":"Zichuan Fu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Fu, Zichuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134759359","display_name":"Xian Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Xian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134801797","display_name":"Guojing Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Guojing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134800477","display_name":"Yejing Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yejing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134753208","display_name":"Yijun Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yijun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134775019","display_name":"Zihao Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Zihao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134820820","display_name":"Yixuan Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Yixuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122243046","display_name":"Hanyu Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Hanyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134782959","display_name":"Yefeng Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Yefeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134798490","display_name":"Xiangyu Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Xiangyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5134805743"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3463999927043915,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3463999927043915,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.13920000195503235,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.08860000222921371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5623999834060669},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.46050000190734863},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.41929998993873596},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.41499999165534973},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4113999903202057},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.41130000352859497},{"id":"https://openalex.org/keywords/model-based-reasoning","display_name":"Model-based reasoning","score":0.41100001335144043},{"id":"https://openalex.org/keywords/computational-model","display_name":"Computational model","score":0.391400009393692},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.37790000438690186}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7967000007629395},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5623999834060669},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4993000030517578},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.46050000190734863},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.41929998993873596},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.41499999165534973},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4113999903202057},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.41130000352859497},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.41100001335144043},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.391400009393692},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.37790000438690186},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3555000126361847},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.35019999742507935},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3416999876499176},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.34040001034736633},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.32100000977516174},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.29420000314712524},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.2793000042438507},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2680000066757202},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.2639000117778778},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.26089999079704285}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.23623","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23623","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.23623","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23623","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.5533388257026672,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advancements":[1],"in":[2,102],"large":[3,56],"language":[4,59],"models":[5,16,60],"(LLMs)":[6],"have":[7],"catalyzed":[8],"the":[9,40,74,104,110,138,170],"rise":[10],"of":[11,86,137],"reasoning-intensive":[12],"inference":[13],"paradigms,":[14],"where":[15],"perform":[17],"explicit":[18],"step-by-step":[19],"reasoning":[20,67,88,106,129,144],"before":[21],"generating":[22,82],"final":[23,111],"answers.":[24],"While":[25],"such":[26],"approaches":[27],"improve":[28],"answer":[29],"quality":[30],"and":[31,57,62,108,116,145],"interpretability,":[32],"they":[33],"incur":[34],"substantial":[35],"computational":[36,71,153],"overhead":[37],"due":[38],"to":[39,64,95,159,179],"prolonged":[41],"generation":[42,147],"sequences.":[43],"In":[44],"this":[45],"paper,":[46],"we":[47],"propose":[48],"Tandem,":[49],"a":[50,78,83,97,120],"novel":[51],"collaborative":[52],"framework":[53],"that":[54,124,150],"synergizes":[55],"small":[58],"(LLMs":[61],"SLMs)":[63],"achieve":[65],"high-quality":[66],"with":[68],"significantly":[69],"reduced":[70],"cost.":[72],"Specifically,":[73],"LLM":[75,161],"serves":[76],"as":[77],"strategic":[79],"coordinator,":[80],"efficiently":[81],"compact":[84],"set":[85],"critical":[87],"insights.":[89],"These":[90],"insights":[91],"are":[92],"then":[93],"used":[94],"guide":[96],"smaller,":[98],"more":[99],"efficient":[100],"SLM":[101],"executing":[103],"full":[105],"process":[107],"delivering":[109],"response.":[112],"To":[113],"balance":[114],"efficiency":[115],"reliability,":[117],"Tandem":[118,151],"introduces":[119],"cost-aware":[121],"termination":[122],"mechanism":[123],"adaptively":[125],"determines":[126],"when":[127],"sufficient":[128],"guidance":[130],"has":[131],"been":[132],"accumulated,":[133],"enabling":[134],"early":[135],"stopping":[136],"LLM's":[139],"generation.":[140],"Experiments":[141],"on":[142,174],"mathematical":[143],"code":[146,184],"benchmarks":[148],"demonstrate":[149],"reduces":[152],"costs":[154],"by":[155],"approximately":[156],"40%":[157],"compared":[158],"standalone":[160],"reasoning,":[162],"while":[163],"achieving":[164],"superior":[165],"or":[166],"competitive":[167],"performance.":[168],"Furthermore,":[169],"sufficiency":[171],"classifier":[172],"trained":[173],"one":[175],"domain":[176],"transfers":[177],"effectively":[178],"others":[180],"without":[181],"retraining.":[182],"The":[183],"is":[185],"available":[186],"at:":[187],"https://github.com/Applied-Machine-Learning-Lab/ACL2026_Tandem.":[188]},"counts_by_year":[],"updated_date":"2026-04-29T06:16:36.941037","created_date":"2026-04-29T00:00:00"}
