{"id":"https://openalex.org/W7133301999","doi":"https://doi.org/10.48550/arxiv.2603.01469","title":"Mean-Flow based One-Step Vision-Language-Action","display_name":"Mean-Flow based One-Step Vision-Language-Action","publication_year":2026,"publication_date":"2026-03-02","ids":{"openalex":"https://openalex.org/W7133301999","doi":"https://doi.org/10.48550/arxiv.2603.01469"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.01469","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01469","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.01469","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128026592","display_name":"Yang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Yang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127990181","display_name":"Xiaoguang Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Xiaoguang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127903259","display_name":"Bin Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Bin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5128026592"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.652400016784668,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.652400016784668,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.12139999866485596,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.035599999129772186,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5521000027656555},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.446399986743927},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.3379000127315521},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.30730000138282776},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.29820001125335693}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6378999948501587},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5521000027656555},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.446399986743927},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40549999475479126},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.3379000127315521},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3296999931335449},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.30730000138282776},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.29820001125335693},{"id":"https://openalex.org/C3018907156","wikidata":"https://www.wikidata.org/wiki/Q7785058","display_name":"Third generation","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.28790000081062317},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.27300000190734863}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.01469","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01469","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.01469","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01469","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,11,65],"FlowMatching-based":[3],"Vision-Language-Action":[4],"(VLA)":[5],"frameworks":[6],"have":[7],"demonstrated":[8],"remarkable":[9],"advantages":[10],"generating":[12],"high-frequency":[13],"action":[14,67,88],"chunks,":[15],"particularly":[16],"for":[17,130],"highly":[18],"dexterous":[19],"robotic":[20,91,132],"manipulation":[21],"tasks.":[22],"Despite":[23],"these":[24],"notable":[25],"achievements,":[26],"their":[27],"practical":[28],"applications":[29],"are":[30],"constrained":[31],"by":[32],"prolonged":[33],"generation":[34,68,83,96],"latency,":[35],"which":[36],"stems":[37],"from":[38],"inherent":[39,75],"iterative":[40],"sampling":[41],"requirements":[42],"and":[43,85,108,116],"architectural":[44],"limitations.":[45],"To":[46],"address":[47],"this":[48],"critical":[49],"bottleneck,":[50],"we":[51,60],"propose":[52],"a":[53,127],"Mean-Flow":[54,101],"based":[55,102],"One-Step":[56,103],"VLA":[57,104],"approach.":[58],"Specifically,":[59],"resolve":[61],"the":[62,66,72,95,99],"noise-induced":[63],"issues":[64],"process,":[69],"thereby":[70],"eliminating":[71],"consistency":[73],"constraints":[74],"to":[76],"conventional":[77],"Flow-Matching":[78],"methods.":[79],"This":[80],"significantly":[81],"enhances":[82],"efficiency":[84],"enables":[86],"one-step":[87],"generation.":[89],"Real-world":[90],"experiments":[92],"show":[93],"that":[94,113],"speed":[97],"of":[98,114],"proposed":[100],"is":[105],"8.7":[106],"times":[107,110],"83.9":[109],"faster":[111],"than":[112],"SmolVLA":[115],"Diffusion":[117],"Policy,":[118],"respectively.":[119],"These":[120],"results":[121],"elucidate":[122],"its":[123],"great":[124],"potential":[125],"as":[126],"high-efficiency":[128],"backbone":[129],"VLA-based":[131],"manipulation.":[133]},"counts_by_year":[],"updated_date":"2026-03-04T07:09:34.246503","created_date":"2026-03-04T00:00:00"}
