{"id":"https://openalex.org/W7162306973","doi":"https://doi.org/10.48550/arxiv.2605.23341","title":"Sparse Compositional Flow Matching by geometric assembly from motion primitives","display_name":"Sparse Compositional Flow Matching by geometric assembly from motion primitives","publication_year":2026,"publication_date":"2026-05-22","ids":{"openalex":"https://openalex.org/W7162306973","doi":"https://doi.org/10.48550/arxiv.2605.23341"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.23341","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23341","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.23341","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136989193","display_name":"Yan Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Yan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136972580","display_name":"Yuanbo Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Yuanbo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136895989","display_name":"Tingyu Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Tingyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072628291","display_name":"\u9ec4\u7ecd\u4f26","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Shaolun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136916830","display_name":"Yang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.2709999978542328,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.2709999978542328,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.24650000035762787,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.12950000166893005,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5539000034332275},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.5209000110626221},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5008000135421753},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.492900013923645},{"id":"https://openalex.org/keywords/motion-capture","display_name":"Motion capture","score":0.44690001010894775},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.41909998655319214},{"id":"https://openalex.org/keywords/geometric-primitive","display_name":"Geometric primitive","score":0.41769999265670776},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.4002000093460083},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.3896999955177307},{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.3682999908924103},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.367000013589859}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6740999817848206},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5539000034332275},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.5209000110626221},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5051000118255615},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5008000135421753},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.492900013923645},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4885999858379364},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4681999981403351},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.44690001010894775},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.41909998655319214},{"id":"https://openalex.org/C181095308","wikidata":"https://www.wikidata.org/wiki/Q1541599","display_name":"Geometric primitive","level":2,"score":0.41769999265670776},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.4002000093460083},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.3896999955177307},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3684999942779541},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.3682999908924103},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.367000013589859},{"id":"https://openalex.org/C10912380","wikidata":"https://www.wikidata.org/wiki/Q527952","display_name":"Visual servoing","level":3,"score":0.34700000286102295},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.33730000257492065},{"id":"https://openalex.org/C146834321","wikidata":"https://www.wikidata.org/wiki/Q2979672","display_name":"Closure (psychology)","level":2,"score":0.32280001044273376},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.32170000672340393},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.321399986743927},{"id":"https://openalex.org/C17137986","wikidata":"https://www.wikidata.org/wiki/Q215067","display_name":"Orthogonality","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.3156999945640564},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.31450000405311584},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.3093999922275543},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.3046000003814697},{"id":"https://openalex.org/C2779190172","wikidata":"https://www.wikidata.org/wiki/Q4913888","display_name":"Binary data","level":3,"score":0.2971000075340271},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2816999852657318},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.27379998564720154},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.27239999175071716},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C184720557","wikidata":"https://www.wikidata.org/wiki/Q7825049","display_name":"Topology (electrical circuits)","level":2,"score":0.2705000042915344},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.2685000002384186},{"id":"https://openalex.org/C4069607","wikidata":"https://www.wikidata.org/wiki/Q868732","display_name":"Aliasing","level":3,"score":0.2678000032901764},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C130440534","wikidata":"https://www.wikidata.org/wiki/Q14946528","display_name":"Conflation","level":2,"score":0.2603999972343445}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.23341","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23341","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.23341","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23341","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Embodied":[0],"trajectories,":[1],"such":[2],"as":[3,29,85],"the":[4,45,50,57,132,160,164,209,216,232],"executable":[5],"motion":[6,78,91],"sequences":[7],"of":[8,20,89],"robotic":[9],"manipulators,":[10],"underwater":[11],"vehicles,":[12],"and":[13,93,114,155,188,197,207,214,227],"mobile":[14],"robots,":[15],"are":[16],"a":[17,30,65,70,86,111,137,151,181,189],"fundamental":[18],"output":[19],"embodied":[21,74],"AI.":[22],"Modern":[23],"generative":[24,59],"models":[25],"often":[26],"treat":[27],"them":[28],"dense,":[31],"monolithic":[32],"signal":[33],"generated":[34],"point":[35],"by":[36,56,225,229],"point,":[37],"fitting":[38],"an":[39],"intricate":[40],"high-dimensional":[41],"posterior":[42],"while":[43],"leaving":[44],"data's":[46],"latent":[47,67,112],"structure":[48,68],"unmodeled,":[49],"same":[51],"sample":[52],"inefficiency":[53],"long":[54],"identified":[55],"structured":[58],"model":[60],"literature.":[61],"We":[62,127],"argue":[63],"that":[64,80,193],"compositional":[66,94,106],"is":[69,163,170],"natural":[71],"choice:":[72],"many":[73],"tasks":[75],"share":[76],"recurring":[77],"fragments":[79],"can":[81],"be":[82],"made":[83],"explicit":[84],"finite":[87],"repertoire":[88],"reusable":[90],"primitives,":[92],"units":[95,122],"naturally":[96],"align":[97],"with":[98,140,150,176],"subtask":[99],"boundaries":[100],"to":[101,119,123,221],"support":[102],"task":[103],"decomposition.":[104],"Existing":[105],"generators,":[107],"however,":[108],"compose":[109,129],"in":[110,131],"space":[113,135],"rely":[115],"on":[116],"post-hoc":[117],"decoding":[118],"relate":[120],"sampled":[121],"actual":[124],"trajectory":[125,134],"segments.":[126],"instead":[128],"directly":[130],"physical":[133],"through":[136],"flow-matching":[138],"framework":[139,210],"two":[141],"coupled":[142],"designs.":[143],"Motion-Primitive":[144],"Dictionary":[145],"Learning":[146],"equips":[147],"each":[148],"atom":[149,161],"learnable":[152],"length":[153],"mask":[154],"binary":[156,182],"starting":[157],"indicators":[158],"so":[159],"itself":[162],"primitive,":[165],"reused":[166],"verbatim":[167],"wherever":[168],"it":[169],"placed.":[171],"Structural":[172],"Sparse":[173],"Flow":[174],"Matching":[175],"Geometric":[177],"Constraints":[178],"then":[179],"generates":[180],"placement":[183],"matrix":[184],"using":[185],"duration-aware":[186],"tokenization":[187],"differentiable":[190],"geometric":[191],"loss":[192],"enforces":[194],"spatial":[195],"continuity":[196],"temporal":[198],"contiguity":[199],"where":[200],"adjacent":[201],"primitives":[202],"meet.":[203],"On":[204],"Open":[205],"X-Embodiment":[206],"3DMoTraj,":[208],"attains":[211],"state-of-the-art":[212],"accuracy":[213],"reduces":[215],"FDE/ADE":[217],"ratio":[218],"from":[219],"1.8":[220],"1.07,":[222],"improving":[223],"ADE":[224],"19.2%":[226],"FDE":[228],"21.0%":[230],"over":[231],"strongest":[233],"baseline.":[234]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-26T00:00:00"}
