{"id":"https://openalex.org/W7133811990","doi":"https://doi.org/10.48550/arxiv.2603.03380","title":"LiteVLA-Edge: Quantized On-Device Multimodal Control for Embedded Robotics","display_name":"LiteVLA-Edge: Quantized On-Device Multimodal Control for Embedded Robotics","publication_year":2026,"publication_date":"2026-03-03","ids":{"openalex":"https://openalex.org/W7133811990","doi":"https://doi.org/10.48550/arxiv.2603.03380"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.03380","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063357660","display_name":"Justin Williams","orcid":"https://orcid.org/0000-0002-0195-5509"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Williams, Justin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128145956","display_name":"Kishor Datta Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Kishor Datta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023104987","display_name":"Roy George","orcid":"https://orcid.org/0000-0003-0257-9725"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"George, Roy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5025040269","display_name":"Mrinmoy Sarkar","orcid":"https://orcid.org/0000-0002-6524-9865"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sarkar, Mrinmoy","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5063357660"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8867999911308289,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8867999911308289,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.023600000888109207,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.013000000268220901,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.7003999948501587},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6507999897003174},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.6326000094413757},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5835999846458435},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.4790000021457672},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4528000056743622},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.38040000200271606},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.3702999949455261}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7020999789237976},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.7003999948501587},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6507999897003174},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.6326000094413757},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5835999846458435},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.555899977684021},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.4790000021457672},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4528000056743622},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.38040000200271606},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3702999949455261},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3528999984264374},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.3301999866962433},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.3278000056743622},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.31299999356269836},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3068000078201294},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3057999908924103},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2930000126361847},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2777999937534332},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.26269999146461487}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.03380","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.03380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.03380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.03380","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision-Language-Action":[0],"(VLA)":[1],"models":[2,114],"provide":[3,138],"a":[4,40,78,91,98,105,139],"unified":[5],"framework":[6],"for":[7,44,109,133,142],"perception,":[8,124],"language":[9],"conditioning,":[10],"and":[11,31,65,126,137],"action":[12],"generation,":[13],"but":[14],"many":[15],"existing":[16],"systems":[17,107],"remain":[18],"difficult":[19],"to":[20],"deploy":[21],"in":[22,58,149],"embedded":[23,117],"robotic":[24],"settings":[25],"because":[26],"of":[27,82,146],"their":[28],"computational":[29],"requirements":[30],"inference":[32,47,67],"latency.":[33],"In":[34],"this":[35],"paper,":[36],"we":[37],"present":[38],"LiteVLA-Edge,":[39],"deployment-oriented":[41],"VLA":[42],"pipeline":[43],"fully":[45],"on-device":[46,147],"on":[48,116],"Jetson":[49],"Orin-class":[50],"hardware.":[51],"Our":[52],"approach":[53],"combines":[54],"supervised":[55],"image-to-action":[56],"fine-tuning":[57],"FP32":[59],"with":[60],"post-training":[61],"4-bit":[62],"GGUF":[63],"quantization":[64],"GPU-accelerated":[66],"through":[68],"the":[69],"\\texttt{llama.cpp}":[70],"runtime.":[71],"Under":[72],"our":[73,102],"deployment":[74],"configuration,":[75],"LiteVLA-Edge":[76],"achieves":[77],"mean":[79],"end-to-end":[80],"latency":[81],"150.5\\,ms":[83],"(approximately":[84],"6.6\\,Hz)":[85],"while":[86,119],"operating":[87],"entirely":[88],"offline":[89],"within":[90],"ROS~2-integrated":[92],"perception--reasoning--action":[93],"pipeline.":[94],"Rather":[95],"than":[96],"introducing":[97],"new":[99],"policy":[100],"objective,":[101],"contribution":[103],"is":[104],"practical":[106],"path":[108],"executing":[110],"compact":[111],"multimodal":[112],"control":[113,136],"locally":[115],"hardware":[118],"preserving":[120],"modular":[121],"interfaces":[122],"between":[123],"reasoning,":[125],"actuation.":[127],"These":[128],"results":[129],"establish":[130],"timing":[131],"feasibility":[132],"reactive":[134],"language-conditioned":[135],"reproducible":[140],"baseline":[141],"future":[143],"task-level":[144],"evaluation":[145],"VLAs":[148],"robotics.":[150]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-03-06T00:00:00"}
