{"id":"https://openalex.org/W7128016324","doi":"https://doi.org/10.48550/arxiv.2602.05755","title":"FMPose3D: monocular 3D pose estimation via flow matching","display_name":"FMPose3D: monocular 3D pose estimation via flow matching","publication_year":2026,"publication_date":"2026-02-05","ids":{"openalex":"https://openalex.org/W7128016324","doi":"https://doi.org/10.48550/arxiv.2602.05755"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.05755","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125182396","display_name":"Ti Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Ti","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101088801","display_name":"Xiaohang Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Xiaohang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5025196309","display_name":"Mackenzie Weygandt Mathis","orcid":"https://orcid.org/0000-0001-7368-4456"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mathis, Mackenzie Weygandt","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5125182396"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.6262999773025513,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.6262999773025513,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.13179999589920044,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.10260000079870224,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7516000270843506},{"id":"https://openalex.org/keywords/articulated-body-pose-estimation","display_name":"Articulated body pose estimation","score":0.7509999871253967},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.7218999862670898},{"id":"https://openalex.org/keywords/posterior-probability","display_name":"Posterior probability","score":0.477400004863739},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.47600001096725464},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.44110000133514404},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.43970000743865967},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.41350001096725464},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.4088999927043915},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3889000117778778}],"concepts":[{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7516000270843506},{"id":"https://openalex.org/C22100474","wikidata":"https://www.wikidata.org/wiki/Q4800952","display_name":"Articulated body pose estimation","level":4,"score":0.7509999871253967},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.722000002861023},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.7218999862670898},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6093000173568726},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4968000054359436},{"id":"https://openalex.org/C57830394","wikidata":"https://www.wikidata.org/wiki/Q278079","display_name":"Posterior probability","level":3,"score":0.477400004863739},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.47600001096725464},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.44110000133514404},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.43970000743865967},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.41350001096725464},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.4088999927043915},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3889000117778778},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.38600000739097595},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.3847000002861023},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.375900000333786},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.3407000005245209},{"id":"https://openalex.org/C2778045648","wikidata":"https://www.wikidata.org/wiki/Q176827","display_name":"Markov random field","level":4,"score":0.3400999903678894},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.33239999413490295},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.32850000262260437},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.32749998569488525},{"id":"https://openalex.org/C52740198","wikidata":"https://www.wikidata.org/wiki/Q1539564","display_name":"Importance sampling","level":3,"score":0.32710000872612},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.29269999265670776},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.28290000557899475},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.2800000011920929},{"id":"https://openalex.org/C51955184","wikidata":"https://www.wikidata.org/wiki/Q1545585","display_name":"Stochastic differential equation","level":2,"score":0.27459999918937683},{"id":"https://openalex.org/C555745239","wikidata":"https://www.wikidata.org/wiki/Q133220","display_name":"Sonar","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2727000117301941},{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.26159998774528503},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25609999895095825},{"id":"https://openalex.org/C23903533","wikidata":"https://www.wikidata.org/wiki/Q17122739","display_name":"Reprojection error","level":3,"score":0.25380000472068787},{"id":"https://openalex.org/C34862557","wikidata":"https://www.wikidata.org/wiki/Q178985","display_name":"Ode","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.05755","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.05755","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.05755","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.05755","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Monocular":[0],"3D":[1,21,72,92,115,164,188,200],"pose":[2,22,73,86,93,131,175,190,201],"estimation":[3,87,94,176],"is":[4,205],"fundamentally":[5],"ill-posed":[6],"due":[7],"to":[8,56,110],"depth":[9],"ambiguity":[10],"and":[11,179,181,193],"occlusions,":[12],"thereby":[13],"motivating":[14],"probabilistic":[15],"methods":[16,169],"that":[17,90],"generate":[18],"multiple":[19],"plausible":[20,114],"hypotheses.":[23,165],"In":[24,49],"particular,":[25],"diffusion-based":[26],"models":[27],"have":[28],"recently":[29],"demonstrated":[30],"strong":[31,196],"performance,":[32],"but":[33],"their":[34],"iterative":[35],"denoising":[36],"process":[37],"typically":[38],"requires":[39],"many":[40],"timesteps":[41],"for":[42],"each":[43],"prediction,":[44],"making":[45],"inference":[46],"computationally":[47],"expensive.":[48],"contrast,":[50],"we":[51,147],"leverage":[52],"Flow":[53],"Matching":[54],"(FM)":[55],"learn":[57],"a":[58,77,83,96,106,140,150],"velocity":[59],"field":[60],"defined":[61],"by":[62,133],"an":[63],"Ordinary":[64],"Differential":[65],"Equation":[66],"(ODE),":[67],"enabling":[68],"efficient":[69],"generation":[70],"of":[71,113],"samples":[74,104],"with":[75],"only":[76,118],"few":[78],"integration":[79],"steps.":[80],"We":[81],"propose":[82],"novel":[84],"generative":[85],"framework,":[88],"FMPose3D,":[89],"formulates":[91],"as":[95],"conditional":[97],"distribution":[98,112],"transport":[99],"problem.":[100],"It":[101],"continuously":[102],"transports":[103],"from":[105,144],"standard":[107],"Gaussian":[108],"prior":[109],"the":[111,159,171,187],"poses":[116],"conditioned":[117],"on":[119,170,186],"2D":[120],"inputs.":[121],"Although":[122],"ODE":[123],"trajectories":[124],"are":[125],"deterministic,":[126],"FMPose3D":[127,166],"naturally":[128],"generates":[129],"various":[130],"hypotheses":[132],"sampling":[134],"different":[135],"noise":[136],"seeds.":[137],"To":[138],"obtain":[139],"single":[141],"accurate":[142],"prediction":[143],"those":[145],"hypotheses,":[146],"further":[148,182],"introduce":[149],"Reprojection-based":[151],"Posterior":[152],"Expectation":[153],"Aggregation":[154],"(RPEA)":[155],"module,":[156],"which":[157],"approximates":[158],"Bayesian":[160],"posterior":[161],"expectation":[162],"over":[163],"surpasses":[167],"existing":[168],"widely":[172],"used":[173],"human":[174],"benchmarks":[177],"Human3.6M":[178],"MPI-INF-3DHP,":[180],"achieves":[183],"state-of-the-art":[184],"performance":[185,197],"animal":[189],"datasets":[191],"Animal3D":[192],"CtrlAni3D,":[194],"demonstrating":[195],"across":[198],"both":[199],"domains.":[202],"The":[203],"code":[204],"available":[206],"at":[207],"https://github.com/AdaptiveMotorControlLab/FMPose3D.":[208]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-07T00:00:00"}
