{"id":"https://openalex.org/W4413785902","doi":"https://doi.org/10.1109/tpami.2025.3600413","title":"Towards Human-Level 3D Relative Pose Estimation: Generalizable, Training-Free, With Single Reference","display_name":"Towards Human-Level 3D Relative Pose Estimation: Generalizable, Training-Free, With Single Reference","publication_year":2025,"publication_date":"2025-08-28","ids":{"openalex":"https://openalex.org/W4413785902","doi":"https://doi.org/10.1109/tpami.2025.3600413","pmid":"https://pubmed.ncbi.nlm.nih.gov/40875424"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3600413","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3600413","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101909196","display_name":"Yuan Gao","orcid":"https://orcid.org/0000-0002-7661-2367"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuan Gao","raw_affiliation_strings":["School of Artificial Intelligence, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109739106","display_name":"Yajing Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yajing Luo","raw_affiliation_strings":["School of Computer Science, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101504942","display_name":"Junhong Wang","orcid":"https://orcid.org/0000-0002-6437-3311"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junhong Wang","raw_affiliation_strings":["MoreFun Studio, Tencent Games, Tencent, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"MoreFun Studio, Tencent Games, Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Kui Jia","orcid":"https://orcid.org/0000-0003-2661-5700"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kui Jia","raw_affiliation_strings":["School of Data Science, The Chinese University of Hong Kong, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"School of Data Science, The Chinese University of Hong Kong, Shenzhen, China","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073032922","display_name":"Gui-Song Xia","orcid":"https://orcid.org/0000-0001-7660-6090"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gui-Song Xia","raw_affiliation_strings":["School of Artificial Intelligence, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101909196"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21015427,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"47","issue":"12","first_page":"11417","last_page":"11430"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.701580286026001},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6957175135612488},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.675788164138794},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.581902265548706},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.47339093685150146},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.43549519777297974},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4188401401042938},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.39499014616012573},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1257985234260559}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.701580286026001},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6957175135612488},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.675788164138794},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.581902265548706},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.47339093685150146},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.43549519777297974},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4188401401042938},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39499014616012573},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1257985234260559},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3600413","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3600413","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:40875424","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40875424","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5372796809","display_name":null,"funder_award_id":"62306214","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7875021329","display_name":null,"funder_award_id":"62325111","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":69,"referenced_works":["https://openalex.org/W132147841","https://openalex.org/W1526868886","https://openalex.org/W1991544872","https://openalex.org/W1999534094","https://openalex.org/W2002827932","https://openalex.org/W2031367292","https://openalex.org/W2097320252","https://openalex.org/W2128019145","https://openalex.org/W2292482869","https://openalex.org/W2518714726","https://openalex.org/W2562637781","https://openalex.org/W2583683993","https://openalex.org/W2604236302","https://openalex.org/W2768879211","https://openalex.org/W2962760512","https://openalex.org/W2962783853","https://openalex.org/W2963188159","https://openalex.org/W2963756608","https://openalex.org/W2963892972","https://openalex.org/W2964249569","https://openalex.org/W2964492019","https://openalex.org/W2981378444","https://openalex.org/W2989915422","https://openalex.org/W3034268164","https://openalex.org/W3034275286","https://openalex.org/W3034597466","https://openalex.org/W3034712732","https://openalex.org/W3034986117","https://openalex.org/W3106672182","https://openalex.org/W3107992529","https://openalex.org/W3159481202","https://openalex.org/W3163945288","https://openalex.org/W3166285241","https://openalex.org/W3177069133","https://openalex.org/W3193676140","https://openalex.org/W3196328566","https://openalex.org/W3202459445","https://openalex.org/W3202538459","https://openalex.org/W3207966761","https://openalex.org/W4221167997","https://openalex.org/W4224598146","https://openalex.org/W4281557677","https://openalex.org/W4298014068","https://openalex.org/W4312296985","https://openalex.org/W4312339117","https://openalex.org/W4312359138","https://openalex.org/W4312360915","https://openalex.org/W4312445439","https://openalex.org/W4312594783","https://openalex.org/W4312933868","https://openalex.org/W4313134354","https://openalex.org/W4386066287","https://openalex.org/W4386072266","https://openalex.org/W4386075660","https://openalex.org/W4390871728","https://openalex.org/W4390872210","https://openalex.org/W4390873710","https://openalex.org/W4390874575","https://openalex.org/W4399563713","https://openalex.org/W4402667888","https://openalex.org/W4402727436","https://openalex.org/W4402727562","https://openalex.org/W4402727742","https://openalex.org/W4402753846","https://openalex.org/W4402754209","https://openalex.org/W4403510570","https://openalex.org/W4403842181","https://openalex.org/W4403941282","https://openalex.org/W4415798746"],"related_works":["https://openalex.org/W230091440","https://openalex.org/W2233261550","https://openalex.org/W2810751659","https://openalex.org/W258997015","https://openalex.org/W2997094352","https://openalex.org/W2123263858","https://openalex.org/W3127959533","https://openalex.org/W4412817058","https://openalex.org/W3216976533","https://openalex.org/W100620283"],"abstract_inverted_index":{"Humans":[0],"can":[1,170],"easily":[2],"deduce":[3],"the":[4,78,88,102,108,111,118,142,149,153,156,161,201,207,212],"relative":[5,60,163],"pose":[6,61],"of":[7],"a":[8,18,34,56,70,92,132,166,179],"previously":[9],"unseen":[10,175],"object,":[11],"without":[12,183],"labeling":[13,184],"or":[14,185],"training,":[15],"given":[16,177],"only":[17,178],"single":[19,35,180],"query-reference":[20],"image":[21],"pair.":[22],"This":[23],"is":[24],"arguably":[25],"achieved":[26],"by":[27,52,64,107,115],"incorporating":[28],"i)":[29],"3D/2.5D":[30,66],"shape":[31,67,72],"perception":[32,68],"from":[33,73,91,117,140],"image,":[36],"ii)":[37],"render-and-compare":[38,79],"simulation,":[39],"and":[40,86,110,125,145,192,211],"iii)":[41],"rich":[42],"semantic":[43,89,112,126,146],"cue":[44],"awareness":[45],"to":[46,159,174],"furnish":[47],"(coarse)":[48],"reference-query":[49],"correspondence.":[50],"Motivated":[51],"this,":[53],"we":[54],"propose":[55],"novel":[57,133],"3D":[58,162],"generalizable":[59],"estimation":[62],"method":[63,169,198],"elaborating":[65],"with":[69,81,148],"2.5D":[71,103],"an":[74,82],"RGB-D":[75,181],"reference,":[76,182],"fulfilling":[77],"paradigm":[80],"off-the-shelf":[83],"differentiable":[84,99,157],"renderer,":[85],"leveraging":[87],"cues":[90],"pretrained":[93],"model":[94],"like":[95],"DINOv2.":[96],"Specifically,":[97],"our":[98,168,196],"renderer":[100,158],"takes":[101],"rotatable":[104],"mesh":[105],"textured":[106],"RGB":[109,119,124,144],"maps":[113,127,147],"(obtained":[114],"DINOv2":[116],"input),":[120],"then":[121],"renders":[122],"new":[123],"(with":[128],"back-surface":[129],"culling)":[130],"under":[131,206],"rotated":[134],"view.":[135],"The":[136],"refinement":[137],"loss":[138],"comes":[139],"comparing":[141],"rendered":[143],"query":[150],"ones,":[151],"back-propagating":[152],"gradients":[154],"through":[155],"refine":[160],"pose.":[164],"As":[165],"result,":[167],"be":[171],"readily":[172],"applied":[173],"objects,":[176],"training.":[186],"Extensive":[187],"experiments":[188],"on":[189],"LineMOD,":[190],"LM-O,":[191],"YCB-V":[193],"show":[194],"that":[195],"training-free":[197],"significantly":[199],"outperforms":[200],"state-of-the-art":[202],"supervised":[203],"methods,":[204],"especially":[205],"rigorous":[208],"Acc@5/10/15$^\\circ$\u2218":[209],"metrics":[210],"challenging":[213],"cross-dataset":[214],"settings.":[215]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
