{"id":"https://openalex.org/W7131419374","doi":"https://doi.org/10.48550/arxiv.2602.19719","title":"Generative 6D Pose Estimation via Conditional Flow Matching","display_name":"Generative 6D Pose Estimation via Conditional Flow Matching","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131419374","doi":"https://doi.org/10.48550/arxiv.2602.19719"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.19719","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19719","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.19719","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126851481","display_name":"Amir Hamza","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hamza, Amir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064432821","display_name":"Davide Boscaini","orcid":"https://orcid.org/0000-0003-4887-2038"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boscaini, Davide","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126850102","display_name":"Weihang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Weihang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107007924","display_name":"Busam Benjamin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Busam, Benjamin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5115002949","display_name":"Fabio Poiesi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Poiesi, Fabio","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5126851481"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.46230000257492065,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.46230000257492065,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.1145000010728836,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.10130000114440918,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7102000117301941},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6470999717712402},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6424000263214111},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5056999921798706},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5002999901771545},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4959000051021576},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.4894999861717224},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4666999876499176},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4666000008583069}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7333999872207642},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7102000117301941},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6470999717712402},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6424000263214111},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6345999836921692},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5056999921798706},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5002999901771545},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4959000051021576},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.4894999861717224},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4666999876499176},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4666000008583069},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4278999865055084},{"id":"https://openalex.org/C22100474","wikidata":"https://www.wikidata.org/wiki/Q4800952","display_name":"Articulated body pose estimation","level":4,"score":0.37059998512268066},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36570000648498535},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.35510000586509705},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.3546999990940094},{"id":"https://openalex.org/C2983787585","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature matching","level":3,"score":0.34049999713897705},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.326200008392334},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3102000057697296},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.3059999942779541},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3050000071525574},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.3027999997138977},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.29789999127388},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.2741999924182892},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.26750001311302185},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2639000117778778}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.19719","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19719","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.19719","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19719","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Existing":[0],"methods":[1,133],"for":[2],"instance-level":[3],"6D":[4,55],"pose":[5,17,56],"estimation":[6,57],"typically":[7],"rely":[8],"on":[9,81,88,96,122],"neural":[10],"networks":[11],"that":[12,72],"either":[13],"directly":[14],"regress":[15],"the":[16,35,39,126],"in":[18,38,64],"$\\mathrm{SE}(3)$":[19],"or":[20],"estimate":[21],"it":[22],"indirectly":[23],"via":[24,76],"local":[25,43,82],"feature":[26],"matching.":[27],"The":[28],"former":[29],"struggle":[30],"with":[31,134],"object":[32,74,109],"symmetries,":[33],"while":[34],"latter":[36],"fail":[37],"absence":[40],"of":[41,54,138],"distinctive":[42],"features.":[44,83],"To":[45],"overcome":[46],"these":[47],"limitations,":[48],"we":[49],"propose":[50],"a":[51,59,69,77],"novel":[52],"formulation":[53],"as":[58],"conditional":[60,89],"flow":[61,90],"matching":[62,91],"problem":[63],"$\\mathbb{R}^3$.":[65],"We":[66,111,119],"introduce":[67],"Flose,":[68],"generative":[70],"method":[71],"infers":[73],"poses":[75],"denoising":[78,93],"process":[79],"conditioned":[80],"While":[84],"prior":[85,132],"approaches":[86],"based":[87,95],"perform":[92],"solely":[94],"geometric":[97],"guidance,":[98],"Flose":[99,121,130],"integrates":[100],"appearance-based":[101],"semantic":[102],"features":[103],"to":[104,116],"mitigate":[105],"ambiguities":[106],"caused":[107],"by":[108],"symmetries.":[110],"further":[112],"incorporate":[113],"RANSAC-based":[114],"registration":[115],"handle":[117],"outliers.":[118],"validate":[120],"five":[123],"datasets":[124],"from":[125],"established":[127],"BOP":[128],"benchmark.":[129],"outperforms":[131],"an":[135],"average":[136],"improvement":[137],"+4.5":[139],"Average":[140],"Recall.":[141],"Project":[142],"Website":[143],":":[144],"https://tev-fbk.github.io/Flose/":[145]},"counts_by_year":[],"updated_date":"2026-02-26T06:34:08.959763","created_date":"2026-02-26T00:00:00"}
