{"id":"https://openalex.org/W7151742465","doi":"https://doi.org/10.48550/arxiv.2604.05656","title":"SnapFlow: One-Step Action Generation for Flow-Matching VLAs via Progressive Self-Distillation","display_name":"SnapFlow: One-Step Action Generation for Flow-Matching VLAs via Progressive Self-Distillation","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7151742465","doi":"https://doi.org/10.48550/arxiv.2604.05656"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.05656","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05656","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.05656","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039931971","display_name":"Wuyang Luan","orcid":"https://orcid.org/0009-0005-6715-5706"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luan, Wuyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133224977","display_name":"Junhui Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Junhui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133234545","display_name":"Weiguang Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Weiguang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133224060","display_name":"Wenjian Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Wenjian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101524699","display_name":"Tao Wu","orcid":"https://orcid.org/0000-0003-4459-2696"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Tieru","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133159371","display_name":"Rui Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.7936000227928162,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.7936000227928162,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.03909999877214432,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.022600000724196434,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5444999933242798},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5314000248908997},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.4607999920845032},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.42289999127388},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.42080000042915344},{"id":"https://openalex.org/keywords/ode","display_name":"Ode","score":0.3610999882221222},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.36070001125335693},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.3547999858856201}],"concepts":[{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5444999933242798},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5314000248908997},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.49549999833106995},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46950000524520874},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.4607999920845032},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.42289999127388},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.42080000042915344},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.38499999046325684},{"id":"https://openalex.org/C34862557","wikidata":"https://www.wikidata.org/wiki/Q178985","display_name":"Ode","level":2,"score":0.3610999882221222},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.36070001125335693},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.3547999858856201},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.3386000096797943},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.319599986076355},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.3149000108242035},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.3050999939441681},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.3037000000476837},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.29499998688697815},{"id":"https://openalex.org/C22679943","wikidata":"https://www.wikidata.org/wiki/Q159375","display_name":"Standard deviation","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2766000032424927},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C67923128","wikidata":"https://www.wikidata.org/wiki/Q1481893","display_name":"Jacobi method","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C28034677","wikidata":"https://www.wikidata.org/wiki/Q17092530","display_name":"Interleaving","level":2,"score":0.257099986076355},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.2567000091075897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.05656","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05656","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.05656","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05656","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision-Language-Action":[0],"(VLA)":[1],"models":[2],"based":[3],"on":[4,31,53,153,159,171,211,226],"flow":[5],"matching":[6,188],"--":[7,14,187,198],"such":[8],"as":[9,117],"pi0,":[10],"pi0.5,":[11],"and":[12,133,149,194,203,253],"SmolVLA":[13,212],"achieve":[15],"state-of-the-art":[16],"generalist":[17],"robotic":[18],"manipulation,":[19],"yet":[20],"their":[21],"iterative":[22],"denoising,":[23],"typically":[24],"10":[25],"ODE":[26],"steps,":[27],"introduces":[28],"substantial":[29],"latency:":[30],"a":[32,69,78,138,154,164],"modern":[33],"GPU,":[34],"denoising":[35,76,201],"alone":[36],"accounts":[37],"for":[38,63,83],"80%":[39],"of":[40],"end-to-end":[41,204,221],"inference":[42],"time.":[43],"Naively":[44],"reducing":[45],"the":[46,58,103,110,126,189,243],"step":[47],"count":[48],"is":[49,249],"unreliable,":[50],"degrading":[51],"success":[52,186],"most":[54],"tasks":[55,228],"due":[56],"to":[57,209,251],"velocity":[59,107,131],"field":[60],"being":[61],"uncalibrated":[62],"single-step":[64],"jumps.":[65],"We":[66,157],"present":[67],"SnapFlow,":[68],"plug-and-play":[70],"self-distillation":[71],"method":[72],"that":[73,230],"compresses":[74],"multi-step":[75],"into":[77],"single":[79,139,155],"forward":[80],"pass":[81],"(1-NFE)":[82],"flow-matching":[84,89],"VLAs.":[85],"SnapFlow":[86,141,182,231,248],"mixes":[87],"standard":[88],"samples":[90,93],"with":[91,168,199,219],"consistency":[92],"whose":[94],"targets":[95],"are":[96],"two-step":[97],"Euler":[98],"shortcut":[99],"velocities":[100],"computed":[101],"from":[102,207],"model's":[104],"own":[105],"marginal":[106],"predictions,":[108],"avoiding":[109],"trajectory":[111],"drift":[112],"caused":[113],"by":[114,217],"conditional":[115],"velocities,":[116],"we":[118],"analyze":[119],"theoretically.":[120],"A":[121],"zero-initialized":[122],"target-time":[123],"embedding":[124],"lets":[125],"network":[127],"switch":[128],"between":[129],"local":[130],"estimation":[132],"global":[134],"one-step":[135],"generation":[136],"within":[137],"architecture.":[140],"requires":[142],"no":[143,146],"external":[144],"teacher,":[145],"architecture":[147],"changes,":[148],"trains":[150],"in":[151],"~12h":[152],"GPU.":[156],"validate":[158],"two":[160],"VLA":[161],"architectures":[162],"spanning":[163],"6x":[165],"parameter":[166],"range,":[167],"identical":[169],"hyperparameters:":[170],"pi0.5":[172],"(3B)":[173],"across":[174,235],"four":[175],"LIBERO":[176],"suites":[177],"(40":[178],"tasks,":[179],"400":[180],"episodes),":[181],"achieves":[183],"98.75%":[184],"average":[185],"10-step":[190],"teacher":[191],"at":[192,240],"97.75%":[193],"slightly":[195],"exceeding":[196],"it":[197,214],"9.6x":[200],"speedup":[202],"latency":[205],"reduced":[206],"274ms":[208],"83ms;":[210],"(500M),":[213],"reduces":[215],"MSE":[216],"8.3%":[218],"3.56x":[220],"acceleration.":[222],"An":[223],"action-step":[224],"sweep":[225],"long-horizon":[227],"reveals":[229],"maintains":[232],"its":[233],"advantage":[234],"execution":[236],"horizons,":[237],"achieving":[238],"93%":[239],"n_act=5":[241],"where":[242],"baseline":[244],"reaches":[245],"only":[246],"90%.":[247],"orthogonal":[250],"layer-distillation":[252],"token-pruning":[254],"approaches,":[255],"enabling":[256],"compositional":[257],"speedups.":[258]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-09T00:00:00"}
