{"id":"https://openalex.org/W4413925994","doi":"https://doi.org/10.1109/icra55743.2025.11128247","title":"A Unified End-to-End Network for Category-Level and Instance-Level Object Pose Estimation from RGB Images","display_name":"A Unified End-to-End Network for Category-Level and Instance-Level Object Pose Estimation from RGB Images","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413925994","doi":"https://doi.org/10.1109/icra55743.2025.11128247"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11128247","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11128247","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040489711","display_name":"Jiale Ren","orcid":"https://orcid.org/0009-0002-8232-5759"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiale Ren","raw_affiliation_strings":["Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China"],"affiliations":[{"raw_affiliation_string":"Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100410336","display_name":"Hong Liu","orcid":"https://orcid.org/0000-0002-9319-2819"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Liu","raw_affiliation_strings":["Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China"],"affiliations":[{"raw_affiliation_string":"Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066220127","display_name":"Jinfu Liu","orcid":"https://orcid.org/0000-0002-5745-5036"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinfu Liu","raw_affiliation_strings":["Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China"],"affiliations":[{"raw_affiliation_string":"Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111193848","display_name":"Peifeng Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peifeng Jiang","raw_affiliation_strings":["Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China"],"affiliations":[{"raw_affiliation_string":"Peking University, Shenzhen Graduate School,State Key Laboratory of General Artificial Intelligence,China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5040489711"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28620837,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"12244","last_page":"12250"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12549","display_name":"Image and Object Detection Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12549","display_name":"Image and Object Detection Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.8061950206756592},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6531957983970642},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6510511636734009},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6309944987297058},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5625710487365723},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.5411116480827332},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.42315560579299927}],"concepts":[{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.8061950206756592},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6531957983970642},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6510511636734009},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6309944987297058},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5625710487365723},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.5411116480827332},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.42315560579299927}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11128247","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11128247","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W132147841","https://openalex.org/W2057069782","https://openalex.org/W2097649661","https://openalex.org/W2128019145","https://openalex.org/W2920961587","https://openalex.org/W2949924544","https://openalex.org/W2963150697","https://openalex.org/W2963188159","https://openalex.org/W2963892972","https://openalex.org/W2989915422","https://openalex.org/W3009516594","https://openalex.org/W3035355652","https://openalex.org/W3093548137","https://openalex.org/W3096609285","https://openalex.org/W3107372911","https://openalex.org/W3107992529","https://openalex.org/W3113383835","https://openalex.org/W3177069133","https://openalex.org/W3196328566","https://openalex.org/W3202459445","https://openalex.org/W3206934897","https://openalex.org/W4206169547","https://openalex.org/W4285541168","https://openalex.org/W4312339117","https://openalex.org/W4312801317","https://openalex.org/W4384562436","https://openalex.org/W4385245566","https://openalex.org/W4392223601","https://openalex.org/W4401416428","https://openalex.org/W4401416926"],"related_works":["https://openalex.org/W2151749779","https://openalex.org/W3179968364","https://openalex.org/W1999612375","https://openalex.org/W2123263858","https://openalex.org/W2938107654","https://openalex.org/W3127959533","https://openalex.org/W4387967917","https://openalex.org/W2736638679","https://openalex.org/W4313046826","https://openalex.org/W1968716783"],"abstract_inverted_index":{"Accurately":[0],"estimating":[1,31],"the":[2,96,148],"6-DoF":[3],"pose":[4,18,56,78,88],"of":[5,150],"objects":[6],"is":[7,58,116,171],"a":[8,38,63,68,81,104,125,131],"fundamental":[9],"challenge":[10],"in":[11,28],"computer":[12],"vision":[13],"and":[14,55,70,85,166],"robotics.":[15],"While":[16],"category-level":[17,43,165],"estimation":[19,79],"based":[20],"on":[21,47,163],"RGBD":[22],"data":[23],"has":[24],"achieved":[25],"good":[26],"performance":[27],"recent":[29],"years,":[30],"poses":[32],"solely":[33],"from":[34,52,90],"RGB":[35,53,91],"images":[36],"remains":[37],"significant":[39],"challenge.":[40],"Existing":[41],"RGB-based":[42,161],"methods":[44,162],"primarily":[45],"focus":[46],"recovering":[48],"object":[49,101,141],"point":[50,133],"clouds":[51],"images,":[54],"prediction":[57,83],"not":[59],"performed":[60],"end-to-end":[61],"by":[62],"network.":[64],"This":[65],"paper":[66],"presents":[67],"Category-level":[69],"Instance-level":[71],"Pose":[72],"Estimation":[73],"Network":[74],"(CIPE),":[75],"which":[76],"models":[77],"as":[80],"set":[82],"problem":[84],"enables":[86],"direct":[87],"regression":[89],"images.":[92],"To":[93],"further":[94],"enhance":[95],"network's":[97],"ability":[98],"to":[99,118,138],"learn":[100],"poses,":[102],"first,":[103],"novel":[105],"learnable":[106],"rotation":[107,111,120],"representation":[108],"that":[109,129,156],"redefines":[110],"learning":[112],"within":[113],"Euclidean":[114],"space":[115],"introduced":[117],"facilitate":[119],"regression.":[121],"Additionally,":[122],"we":[123],"propose":[124],"prior-query":[126],"fusion":[127],"strategy":[128],"utilizes":[130],"pre-trained":[132],"cloud":[134],"feature":[135],"extraction":[136],"network":[137],"integrate":[139],"categorical":[140],"features":[142],"with":[143],"bounding":[144],"boxes,":[145],"thereby":[146],"improving":[147],"incorporation":[149],"category":[151],"information.":[152],"Experimental":[153],"results":[154],"demonstrate":[155],"CIPE":[157],"significantly":[158],"outperforms":[159],"existing":[160],"both":[164],"instance-level":[167],"datasets.":[168],"The":[169],"code":[170],"available":[172],"at":[173],"https://github.com/jialeren/CIPE.":[174]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
