{"id":"https://openalex.org/W7160951195","doi":"https://doi.org/10.48550/arxiv.2605.08665","title":"Hint Tuning: Less Data Makes Better Reasoners","display_name":"Hint Tuning: Less Data Makes Better Reasoners","publication_year":2026,"publication_date":"2026-05-09","ids":{"openalex":"https://openalex.org/W7160951195","doi":"https://doi.org/10.48550/arxiv.2605.08665"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.08665","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.08665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.08665","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135930301","display_name":"Siqi Fan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Siqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135973336","display_name":"Minghao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Minghao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135979561","display_name":"Xiaoqian Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Xiaoqian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135944694","display_name":"Xiusheng Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Xiusheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135924853","display_name":"Zhuo Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zhuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135944426","display_name":"Bowen Qin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Bowen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016293831","display_name":"Liujie Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Liujie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135997763","display_name":"Shuo Shang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shang, Shuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5103275486","display_name":"Weihang Chen","orcid":"https://orcid.org/0000-0003-1380-7631"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Weihang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3077999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3077999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.08990000188350677,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.08290000259876251,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.620199978351593},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6183000206947327},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5328999757766724},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.5076000094413757},{"id":"https://openalex.org/keywords/ideal","display_name":"Ideal (ethics)","score":0.4986000061035156},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.49630001187324524},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.45509999990463257}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7386000156402588},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.620199978351593},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6183000206947327},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5695000290870667},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5328999757766724},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.5076000094413757},{"id":"https://openalex.org/C2776639384","wikidata":"https://www.wikidata.org/wiki/Q840396","display_name":"Ideal (ethics)","level":2,"score":0.4986000061035156},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.49630001187324524},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.45509999990463257},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36320000886917114},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.31369999051094055},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3091999888420105},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.29660001397132874},{"id":"https://openalex.org/C93361087","wikidata":"https://www.wikidata.org/wiki/Q4426698","display_name":"Data consistency","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26750001311302185},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26420000195503235},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.2606000006198883},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.25119999051094055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.08665","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.08665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.08665","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.08665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"reasoning":[1,18,36,97,114],"models":[2,33,115],"achieve":[3,139],"high":[4],"accuracy":[5,125],"through":[6,142],"extended":[7],"chain-of-thought":[8],"but":[9],"generate":[10],"5--8":[11],"more":[12],"tokens":[13],"than":[14],"necessary,":[15],"applying":[16],"verbose":[17],"uniformly":[19],"regardless":[20],"of":[21,85],"problem":[22],"difficulty.":[23],"We":[24],"propose":[25],"Hint":[26,104],"Tuning,":[27],"a":[28,89],"data-efficient":[29],"approach":[30],"that":[31],"teaches":[32],"to":[34],"calibrate":[35],"depth.":[37],"Our":[38],"key":[39],"insight:":[40],"the":[41,54,82,94,146],"corresponding":[42],"instruct":[43,55,95,147],"model":[44,56],"serves":[45],"as":[46],"an":[47],"ideal":[48],"difficulty":[49,86],"probe.":[50],"By":[51],"testing":[52],"what":[53],"can":[57],"solve":[58],"with":[59,145],"varying":[60],"guidance,":[61],"we":[62,138],"automatically":[63],"construct":[64],"training":[65],"data":[66,152],"across":[67,112],"three":[68],"states:":[69],"No-Hint":[70],"(direct":[71],"answer),":[72],"Sparse-Hint":[73],"(minimal":[74],"prefix),":[75],"and":[76,96,151],"Full-Hint":[77],"(complete":[78],"reasoning).":[79],"This":[80],"converts":[81],"abstract":[83],"challenge":[84],"labeling":[87],"into":[88],"measurable":[90],"consistency":[91],"check":[92],"between":[93],"models.":[98],"With":[99],"only":[100],"1K":[101],"self-annotated":[102],"samples,":[103],"Tuning":[105],"achieves":[106],"24--66%":[107],"token":[108],"reduction":[109],"(31.5%":[110],"average)":[111],"mainstream":[113],"(Qwen3-Thinking,":[116],"DeepSeek-R1-Distill)":[117],"at":[118,155],"multiple":[119],"scales":[120],"(4B--32B)":[121],"while":[122],"maintaining":[123],"competitive":[124],"on":[126],"five":[127],"benchmarks.":[128],"Unlike":[129],"methods":[130],"requiring":[131],"massive":[132],"distillation":[133],"datasets":[134],"or":[135],"expensive":[136],"RL,":[137],"superior":[140],"efficiency":[141],"simple":[143],"alignment":[144],"model's":[148],"capabilities.":[149],"Code":[150],"are":[153],"available":[154],"https://github.com/redai-infra/hint-tuning.":[156]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-13T00:00:00"}
