{"id":"https://openalex.org/W7155051620","doi":"https://doi.org/10.48550/arxiv.2604.16694","title":"RankGuide: Tensor-Rank-Guided Routing and Steering for Efficient Reasoning","display_name":"RankGuide: Tensor-Rank-Guided Routing and Steering for Efficient Reasoning","publication_year":2026,"publication_date":"2026-04-17","ids":{"openalex":"https://openalex.org/W7155051620","doi":"https://doi.org/10.48550/arxiv.2604.16694"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.16694","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.16694","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.16694","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134160128","display_name":"Jiayi Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tian, Jiayi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134199907","display_name":"Yupeng Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Yupeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032765315","display_name":"Ryan Solgi","orcid":"https://orcid.org/0000-0002-7560-5210"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Solgi, Ryan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134133373","display_name":"Souvik Kundu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kundu, Souvik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134196353","display_name":"Zheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5134160128"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.4724999964237213,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.4724999964237213,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.24279999732971191,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.05380000174045563,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7598999738693237},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.6175000071525574},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5530999898910522},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.5031999945640564},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.38429999351501465},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.3824999928474426},{"id":"https://openalex.org/keywords/reasoning-system","display_name":"Reasoning system","score":0.32030001282691956}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7598999738693237},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.755299985408783},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.6175000071525574},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5530999898910522},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.5031999945640564},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.38429999351501465},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3824999928474426},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37689998745918274},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3305000066757202},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.32030001282691956},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.29600000381469727},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.28619998693466187},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.26820001006126404},{"id":"https://openalex.org/C2984173633","wikidata":"https://www.wikidata.org/wiki/Q22725","display_name":"Routing algorithm","level":4,"score":0.2605000138282776},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.25949999690055847},{"id":"https://openalex.org/C3018263672","wikidata":"https://www.wikidata.org/wiki/Q1296251","display_name":"Efficient algorithm","level":2,"score":0.2581999897956848}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.16694","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.16694","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.16694","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.16694","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"reasoning":[1,38,43,160,187,197],"models":[2,39],"(LRMs)":[3],"enhance":[4],"problem-solving":[5],"capabilities":[6],"by":[7,207],"generating":[8],"explicit":[9],"multi-step":[10],"chains":[11],"of":[12,89,112,162,202],"thought":[13],"(CoT)":[14],"reasoning;":[15],"however,":[16],"they":[17],"incur":[18],"substantial":[19],"inference":[20,76],"latency":[21,206],"and":[22,55,58,82,85,94,110,118,143,173,191],"computational":[23],"overhead.":[24],"To":[25,69],"mitigate":[26],"this":[27,71],"issue,":[28,72],"recent":[29,52],"works":[30],"have":[31],"explored":[32],"model":[33],"collaboration":[34,114],"paradigms,":[35],"where":[36],"small":[37],"(SRMs)":[40],"generate":[41],"intermediate":[42],"steps":[44,190],"to":[45,135,141,157,183,209,212,219],"achieve":[46,184],"a":[47,66,104,123,151],"better":[48],"accuracy--latency":[49],"trade-off.":[50],"Despite":[51],"progress,":[53],"effectively":[54],"efficiently":[56],"detecting":[57],"mitigating":[59],"SRM":[60,75],"failures":[61],"in":[62,77,204],"collaborative":[63,181],"systems":[64,182],"remains":[65],"key":[67],"challenge.":[68],"address":[70],"we":[73,101,149],"analyze":[74],"both":[78,171],"the":[79,108,159,200],"generated":[80],"text":[81],"hidden-state":[83],"spaces,":[84],"identify":[86],"three":[87],"types":[88],"failure":[90],"modes:":[91],"\\textit{overconfidence},":[92],"\\textit{uncertainty},":[93],"\\textit{heavy":[95],"revalidation}.":[96],"Building":[97],"on":[98,195],"these":[99],"insights,":[100],"propose":[102],"\\textbf{RankGuide},":[103],"framework":[105],"that":[106,126],"improves":[107],"efficiency":[109],"effectiveness":[111],"SRM--LRM":[113,180],"through":[115,175],"tensor-rank-guided":[116],"routing":[117,124,172],"steering.":[119],"Specifically,":[120],"RankGuide":[121,178,203],"leverages":[122],"signal":[125],"incorporates":[127],"tensor-rank":[128,176],"signals":[129],"derived":[130],"from":[131],"consecutive":[132],"hidden":[133],"states":[134],"detect":[136],"when":[137],"SRMs":[138],"are":[139],"likely":[140],"fail":[142],"selectively":[144],"invoke":[145],"LRMs.":[146],"In":[147],"addition,":[148],"introduce":[150],"tensor-rank-filtered":[152],"steering":[153,174],"vector":[154],"extraction":[155],"method":[156],"modulate":[158],"trajectory":[161],"SRMs,":[163],"thereby":[164],"improving":[165,170],"their":[166],"generation":[167],"quality.":[168],"By":[169],"signals,":[177],"enables":[179],"more":[185],"efficient":[186],"with":[188],"fewer":[189],"improved":[192],"accuracy.":[193],"Experiments":[194],"multiple":[196],"benchmarks":[198],"demonstrate":[199],"efficacy":[201],"reducing":[205],"up":[208],"$1.75\\times$":[210],"compared":[211],"LRM,":[213],"while":[214],"maintaining":[215],"competitive":[216],"accuracy":[217],"relative":[218],"prior":[220],"methods.":[221]},"counts_by_year":[],"updated_date":"2026-04-22T06:07:44.442478","created_date":"2026-04-22T00:00:00"}
