{"id":"https://openalex.org/W7133313496","doi":"https://doi.org/10.48550/arxiv.2603.01025","title":"One-Token Verification for Reasoning Correctness Estimation","display_name":"One-Token Verification for Reasoning Correctness Estimation","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133313496","doi":"https://doi.org/10.48550/arxiv.2603.01025"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.01025","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01025","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.01025","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122852808","display_name":"Zhan Zhuang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhuang, Zhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128025195","display_name":"Xiequn Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xiequn","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124335653","display_name":"Zebin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zebin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127980138","display_name":"Feiyang Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Feiyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127902503","display_name":"Ying Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Ying","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123016042","display_name":"Kede Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Kede","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128012492","display_name":"Yu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5122852808"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3160000145435333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3160000145435333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.09880000352859497,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.09279999881982803,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.921500027179718},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6711999773979187},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5702000260353088},{"id":"https://openalex.org/keywords/model-based-reasoning","display_name":"Model-based reasoning","score":0.5022000074386597},{"id":"https://openalex.org/keywords/reasoning-system","display_name":"Reasoning system","score":0.49059998989105225},{"id":"https://openalex.org/keywords/qualitative-reasoning","display_name":"Qualitative reasoning","score":0.46470001339912415},{"id":"https://openalex.org/keywords/automated-reasoning","display_name":"Automated reasoning","score":0.40939998626708984},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.3840999901294708}],"concepts":[{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.921500027179718},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7598000168800354},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6711999773979187},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5702000260353088},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5370000004768372},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.5022000074386597},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.49059998989105225},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.46470001339912415},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.40939998626708984},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.3840999901294708},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3781999945640564},{"id":"https://openalex.org/C97364631","wikidata":"https://www.wikidata.org/wiki/Q484284","display_name":"Deductive reasoning","level":2,"score":0.3682999908924103},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3626999855041504},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.3449000120162964},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3431999981403351},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.32280001044273376},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.3154999911785126},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.30709999799728394},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2881999909877777},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C111498074","wikidata":"https://www.wikidata.org/wiki/Q173326","display_name":"Formal verification","level":2,"score":0.2759999930858612},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2612999975681305}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.01025","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01025","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.01025","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01025","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"breakthroughs":[1],"in":[2,12,30,99],"large":[3],"language":[4],"models":[5],"(LLMs)":[6],"have":[7],"led":[8],"to":[9,121,162],"notable":[10],"successes":[11],"complex":[13],"reasoning":[14,33,78,97,124,146],"tasks,":[15],"such":[16],"as":[17],"mathematical":[18,145],"problem":[19],"solving.":[20],"A":[21],"common":[22],"strategy":[23],"for":[24,65,71],"improving":[25],"performance":[26],"is":[27,41,107],"parallel":[28],"thinking,":[29],"which":[31],"multiple":[32],"traces":[34,79],"are":[35,80],"generated":[36],"and":[37,113],"the":[38,74,116,127],"final":[39],"prediction":[40],"made":[42],"using":[43],"aggregation":[44],"schemes":[45],"like":[46],"majority":[47],"voting":[48],"or":[49],"best-of-$N$":[50],"decoding.":[51],"However,":[52],"two":[53],"key":[54],"challenges":[55],"persist.":[56],"First,":[57],"multi-sample":[58],"decoding":[59],"incurs":[60],"substantial":[61],"inference":[62],"latency,":[63],"especially":[64],"long-form":[66],"outputs.":[67],"Second,":[68],"effective":[69],"mechanisms":[70],"reliably":[72],"assessing":[73],"correctness":[75,98,132],"of":[76,137],"individual":[77],"still":[81],"limited.":[82],"To":[83],"address":[84],"these":[85],"challenges,":[86],"we":[87],"introduce":[88],"One-Token":[89],"Verification":[90],"(OTV),":[91],"a":[92,100,110],"computational":[93],"method":[94],"that":[95,149],"estimates":[96],"single":[101],"forward":[102],"pass":[103],"during":[104],"generation.":[105],"OTV":[106,150,156],"activated":[108],"by":[109,160],"learnable":[111],"token":[112,158],"integrated":[114],"into":[115],"LLM":[117],"via":[118],"low-rank":[119],"adaptation":[120],"probe":[122],"internal":[123],"signals":[125],"through":[126,164],"key-value":[128],"cache,":[129],"supporting":[130],"token-level":[131],"estimation":[133],"at":[134],"any":[135],"stage":[136],"generation":[138],"without":[139],"disrupting":[140],"primary":[141],"reasoning.":[142],"Experiments":[143],"on":[144],"benchmarks":[147],"demonstrate":[148],"consistently":[151],"surpasses":[152],"existing":[153],"verifiers.":[154],"Additionally,":[155],"reduces":[157],"usage":[159],"up":[161],"$90\\%$":[163],"correctness-guided":[165],"early":[166],"termination,":[167],"prioritizing":[168],"shorter,":[169],"more":[170],"reliable":[171],"solutions.":[172]},"counts_by_year":[],"updated_date":"2026-03-04T07:09:34.246503","created_date":"2026-03-04T00:00:00"}
