{"id":"https://openalex.org/W7139107679","doi":"https://doi.org/10.48550/arxiv.2603.16867","title":"Efficient Reasoning on the Edge","display_name":"Efficient Reasoning on the Edge","publication_year":2026,"publication_date":"2026-03-17","ids":{"openalex":"https://openalex.org/W7139107679","doi":"https://doi.org/10.48550/arxiv.2603.16867"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.16867","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16867","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.16867","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036869211","display_name":"Yelysei Bondarenko","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bondarenko, Yelysei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130036952","display_name":"Thomas Hehn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hehn, Thomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130209181","display_name":"Rob Hesselink","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hesselink, Rob","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129833726","display_name":"Romain Lepert","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lepert, Romain","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123827941","display_name":"Fabio Valerio Massoli","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Massoli, Fabio Valerio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013127161","display_name":"Evgeny G. Mironov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mironov, Evgeny","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013359809","display_name":"Leyla Mirvakhabova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mirvakhabova, Leyla","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087547624","display_name":"Tribhuvanesh Orekondy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Orekondy, Tribhuvanesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033196039","display_name":"Spyridon Stasis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stasis, Spyridon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130197491","display_name":"Andrey Kuzmin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuzmin, Andrey","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129759739","display_name":"Anna Kuzina","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuzina, Anna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111645310","display_name":"Markus Nagel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nagel, Markus","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041901606","display_name":"Ankita Nayak","orcid":"https://orcid.org/0000-0001-7821-0460"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nayak, Ankita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044001052","display_name":"Corrado Rainone","orcid":"https://orcid.org/0000-0003-0381-7254"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rainone, Corrado","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032560283","display_name":"Ork de Rooij","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Rooij, Ork","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129900541","display_name":"Paul N Whatmough","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Whatmough, Paul N","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083706779","display_name":"Arash Behboodi","orcid":"https://orcid.org/0000-0001-8229-2809"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Behboodi, Arash","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5055531734","display_name":"Babak Ehteshami Bejnordi","orcid":"https://orcid.org/0000-0002-6258-5687"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bejnordi, Babak Ehteshami","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":18,"corresponding_author_ids":["https://openalex.org/A5036869211"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.21649999916553497,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.21649999916553497,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.1923999935388565,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12238","display_name":"Green IT and Sustainability","score":0.041600000113248825,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6388000249862671},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6320000290870667},{"id":"https://openalex.org/keywords/reasoning-system","display_name":"Reasoning system","score":0.5336999893188477},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5271000266075134},{"id":"https://openalex.org/keywords/automated-reasoning","display_name":"Automated reasoning","score":0.5174999833106995},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.5005999803543091},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.4715999960899353},{"id":"https://openalex.org/keywords/mobile-device","display_name":"Mobile device","score":0.4277999997138977},{"id":"https://openalex.org/keywords/case-based-reasoning","display_name":"Case-based reasoning","score":0.4246000051498413}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8162000179290771},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6388000249862671},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6320000290870667},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.5336999893188477},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5271000266075134},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5242999792098999},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.5174999833106995},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.5005999803543091},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.4715999960899353},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.4277999997138977},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.4246000051498413},{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.423799991607666},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.3986000120639801},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.3716000020503998},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.3711000084877014},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.37040001153945923},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.3416999876499176},{"id":"https://openalex.org/C103057564","wikidata":"https://www.wikidata.org/wiki/Q4751139","display_name":"Analytic reasoning","level":3,"score":0.3334999978542328},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.325300008058548},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3197000026702881},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.3021000027656555},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.29989999532699585},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.29679998755455017},{"id":"https://openalex.org/C155911833","wikidata":"https://www.wikidata.org/wiki/Q3817354","display_name":"Spatial intelligence","level":2,"score":0.290800005197525},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.271699994802475},{"id":"https://openalex.org/C157170001","wikidata":"https://www.wikidata.org/wiki/Q4781507","display_name":"Applications of artificial intelligence","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.257999986410141},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.25060001015663147}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.16867","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16867","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.16867","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16867","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2,47,61],"(LLMs)":[3],"with":[4,93,111],"chain-of-thought":[5],"reasoning":[6,17,43,57,85,139,166,173],"achieve":[7],"state-of-the-art":[8],"performance":[9],"across":[10],"complex":[11],"problem-solving":[12],"tasks,":[13],"but":[14],"their":[15],"verbose":[16,67],"traces":[18,58],"and":[19,39,68,143],"large":[20,36],"context":[21],"requirements":[22],"make":[23],"them":[24],"impractical":[25],"for":[26,48,72,153,175],"edge":[27],"deployment.":[28],"These":[29],"challenges":[30],"include":[31],"high":[32],"token":[33],"generation":[34],"costs,":[35],"KV-cache":[37,145],"footprints,":[38],"inefficiencies":[40],"when":[41,141],"distilling":[42,56],"capabilities":[44],"into":[45,62],"smaller":[46,63],"mobile":[49,176,184],"devices.":[50],"Existing":[51],"approaches":[52],"often":[53],"rely":[54],"on":[55,104,157,183,188],"from":[59],"larger":[60],"models,":[64],"which":[65],"are":[66,186],"stylistically":[69],"redundant,":[70],"undesirable":[71],"on-device":[73,154],"inference.":[74,155],"In":[75],"this":[76],"work,":[77],"we":[78,119,131],"propose":[79],"a":[80,133,144],"lightweight":[81],"approach":[82],"to":[83],"enable":[84],"in":[86],"small":[87],"LLMs":[88],"using":[89],"LoRA":[90],"adapters":[91],"combined":[92],"supervised":[94],"fine-tuning.":[95],"We":[96],"further":[97],"introduce":[98],"budget":[99],"forcing":[100],"via":[101],"reinforcement":[102],"learning":[103],"these":[105],"adapters,":[106],"significantly":[107],"reducing":[108,151],"response":[109],"length":[110],"minimal":[112],"accuracy":[113,125],"loss.":[114],"To":[115],"address":[116],"memory-bound":[117],"decoding,":[118],"exploit":[120],"parallel":[121],"test-time":[122],"scaling,":[123],"improving":[124],"at":[126],"minor":[127],"latency":[128],"increase.":[129],"Finally,":[130],"present":[132],"dynamic":[134],"adapter-switching":[135],"mechanism":[136],"that":[137,160],"activates":[138],"only":[140],"needed":[142],"sharing":[146],"strategy":[147],"during":[148],"prompt":[149],"encoding,":[150],"time-to-first-token":[152],"Experiments":[156],"Qwen2.5-7B":[158],"demonstrate":[159],"our":[161,180,189],"method":[162],"achieves":[163],"efficient,":[164],"accurate":[165],"under":[167],"strict":[168],"resource":[169],"constraints,":[170],"making":[171],"LLM":[172],"practical":[174],"scenarios.":[177],"Videos":[178],"demonstrating":[179],"solution":[181],"running":[182],"devices":[185],"available":[187],"project":[190],"page.":[191]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-20T00:00:00"}
