{"id":"https://openalex.org/W4388926491","doi":"https://doi.org/10.48550/arxiv.2311.11125","title":"SecondPose: SE(3)-Consistent Dual-Stream Feature Fusion for Category-Level Pose Estimation","display_name":"SecondPose: SE(3)-Consistent Dual-Stream Feature Fusion for Category-Level Pose Estimation","publication_year":2023,"publication_date":"2023-11-18","ids":{"openalex":"https://openalex.org/W4388926491","doi":"https://doi.org/10.48550/arxiv.2311.11125"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2311.11125","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.11125","pdf_url":"https://arxiv.org/pdf/2311.11125","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2311.11125","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002537755","display_name":"Yamei Chen","orcid":"https://orcid.org/0000-0002-9072-5157"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Yamei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102634321","display_name":"Yan Di","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Di, Yan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055662103","display_name":"Guangyao Zhai","orcid":"https://orcid.org/0000-0002-1527-5387"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhai, Guangyao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006401089","display_name":"Fabian Manhardt","orcid":"https://orcid.org/0000-0002-4577-4590"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manhardt, Fabian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029834032","display_name":"Chenyangguang Zhang","orcid":"https://orcid.org/0009-0005-7852-4124"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chenyangguang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035771614","display_name":"Ruida Zhang","orcid":"https://orcid.org/0000-0002-2693-3322"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ruida","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041092666","display_name":"Federico Tombari","orcid":"https://orcid.org/0000-0001-5598-5212"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tombari, Federico","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046896448","display_name":"Nassir Navab","orcid":"https://orcid.org/0000-0002-6032-5611"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Navab, Nassir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5067135033","display_name":"Benjamin Busam","orcid":"https://orcid.org/0000-0002-0620-5774"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Busam, Benjamin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5002537755"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7126953601837158},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6806296706199646},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.655197262763977},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5430116653442383},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5383646488189697},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.47571617364883423},{"id":"https://openalex.org/keywords/invariant","display_name":"Invariant (physics)","score":0.46438300609588623},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.44265955686569214},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.42112934589385986},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.26869887113571167},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.16763952374458313}],"concepts":[{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7126953601837158},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6806296706199646},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.655197262763977},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5430116653442383},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5383646488189697},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.47571617364883423},{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.46438300609588623},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.44265955686569214},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.42112934589385986},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.26869887113571167},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.16763952374458313},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2311.11125","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.11125","pdf_url":"https://arxiv.org/pdf/2311.11125","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2311.11125","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2311.11125","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2311.11125","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.11125","pdf_url":"https://arxiv.org/pdf/2311.11125","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4388926491.pdf","grobid_xml":"https://content.openalex.org/works/W4388926491.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3125011624","https://openalex.org/W1508631387","https://openalex.org/W2370917603","https://openalex.org/W2952760143","https://openalex.org/W2017776670","https://openalex.org/W2347897961","https://openalex.org/W2340870721","https://openalex.org/W2358318464","https://openalex.org/W2123263858","https://openalex.org/W1834370135"],"abstract_inverted_index":{"Category-level":[0],"object":[1,95],"pose":[2,9,114],"estimation,":[3],"aiming":[4],"to":[5,76,91,106],"predict":[6],"the":[7,58,101,107,129],"6D":[8],"and":[10],"3D":[11],"size":[12],"of":[13,33,60,72],"objects":[14],"from":[15,55,103],"known":[16],"categories,":[17],"typically":[18],"struggles":[19],"with":[20,51,88],"large":[21,150],"intra-class":[22],"shape":[23],"variation.":[24,36],"Existing":[25],"works":[26],"utilizing":[27],"mean":[28],"shapes":[29],"often":[30],"fall":[31],"short":[32],"capturing":[34],"this":[35,39],"To":[37],"address":[38],"issue,":[40],"we":[41,67],"present":[42],"SecondPose,":[43],"a":[44,93,124,133,149],"novel":[45],"approach":[46],"integrating":[47],"object-specific":[48,80],"geometric":[49,74,83],"features":[50,75,84,90],"semantic":[52,65],"category":[53],"priors":[54],"DINOv2.":[56],"Leveraging":[57],"advantage":[59],"DINOv2":[61,89],"in":[62],"providing":[63],"SE(3)-consistent":[64],"features,":[66],"hierarchically":[68],"extract":[69],"two":[70],"types":[71],"SE(3)-invariant":[73],"further":[77,112],"encapsulate":[78],"local-to-global":[79],"information.":[81],"These":[82],"are":[85],"then":[86],"point-aligned":[87],"establish":[92],"consistent":[94],"representation":[96],"under":[97],"SE(3)":[98],"transformations,":[99],"facilitating":[100],"mapping":[102],"camera":[104],"space":[105],"pre-defined":[108],"canonical":[109],"space,":[110],"thus":[111],"enhancing":[113],"estimation.":[115],"Extensive":[116],"experiments":[117],"on":[118,132],"NOCS-REAL275":[119],"demonstrate":[120],"that":[121],"SecondPose":[122,143],"achieves":[123],"12.4%":[125],"leap":[126],"forward":[127],"over":[128],"state-of-the-art.":[130],"Moreover,":[131],"more":[134],"complex":[135],"dataset":[136],"HouseCat6D":[137],"which":[138],"provides":[139],"photometrically":[140],"challenging":[141],"objects,":[142],"still":[144],"surpasses":[145],"other":[146],"competitors":[147],"by":[148],"margin.":[151]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2023-11-23T00:00:00"}
