{"id":"https://openalex.org/W7130577525","doi":"https://doi.org/10.1109/access.2026.3666439","title":"C3G-VM6D: Data-Efficient C3G Vision Model Aided 6D Pose Estimation Based on RGB-D Data","display_name":"C3G-VM6D: Data-Efficient C3G Vision Model Aided 6D Pose Estimation Based on RGB-D Data","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7130577525","doi":"https://doi.org/10.1109/access.2026.3666439"},"language":"en","primary_location":{"id":"doi:10.1109/access.2026.3666439","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3666439","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2026.3666439","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038968288","display_name":"Md Selim Sarowar","orcid":null},"institutions":[{"id":"https://openalex.org/I55240360","display_name":"Yeungnam University","ror":"https://ror.org/05yc6p159","country_code":"KR","type":"education","lineage":["https://openalex.org/I55240360"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Md Selim Sarowar","raw_affiliation_strings":["Department of Electronics Engineering, Yeungnam University, Gyeongsan, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0002-3158-0357","affiliations":[{"raw_affiliation_string":"Department of Electronics Engineering, Yeungnam University, Gyeongsan, Republic of Korea","institution_ids":["https://openalex.org/I55240360"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012864354","display_name":"Manar Alnaasan","orcid":null},"institutions":[{"id":"https://openalex.org/I55240360","display_name":"Yeungnam University","ror":"https://ror.org/05yc6p159","country_code":"KR","type":"education","lineage":["https://openalex.org/I55240360"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Manar Alnaasan","raw_affiliation_strings":["Department of Electronics Engineering, Yeungnam University, Gyeongsan, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0002-9110-5961","affiliations":[{"raw_affiliation_string":"Department of Electronics Engineering, Yeungnam University, Gyeongsan, Republic of Korea","institution_ids":["https://openalex.org/I55240360"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5121496446","display_name":"Sungho Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I55240360","display_name":"Yeungnam University","ror":"https://ror.org/05yc6p159","country_code":"KR","type":"education","lineage":["https://openalex.org/I55240360"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sungho Kim","raw_affiliation_strings":["Department of Electronics Engineering, Yeungnam University, Gyeongsan, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0002-5401-2459","affiliations":[{"raw_affiliation_string":"Department of Electronics Engineering, Yeungnam University, Gyeongsan, Republic of Korea","institution_ids":["https://openalex.org/I55240360"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.22165911,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":null,"first_page":"34223","last_page":"34238"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.935699999332428,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.935699999332428,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.02630000002682209,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.007000000216066837,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7824000120162964},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.6392999887466431},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5029000043869019},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.42149999737739563},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4065999984741211},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.3813999891281128},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.3813000023365021},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.3749000132083893},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.3490999937057495},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.3434999883174896}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.800000011920929},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7824000120162964},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7260000109672546},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.6392999887466431},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5192000269889832},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5029000043869019},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.42149999737739563},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4065999984741211},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3813999891281128},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.3813000023365021},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.3749000132083893},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.3490999937057495},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.3434999883174896},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.34060001373291016},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.31130000948905945},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.30809998512268066},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.30410000681877136},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.298799991607666},{"id":"https://openalex.org/C74050887","wikidata":"https://www.wikidata.org/wiki/Q848368","display_name":"Rotation (mathematics)","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.29510000348091125},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.28529998660087585},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2840999960899353},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.28349998593330383},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.28299999237060547},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.27709999680519104},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C99404194","wikidata":"https://www.wikidata.org/wiki/Q163362","display_name":"Vanishing point","level":3,"score":0.2687999904155731},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.2655999958515167},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.2621999979019165},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.25850000977516174},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2581999897956848}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2026.3666439","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3666439","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:90705c2858e34521ab552e9320bc6f24","is_oa":true,"landing_page_url":"https://doaj.org/article/90705c2858e34521ab552e9320bc6f24","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 14, Pp 34223-34238 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2026.3666439","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3666439","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3786352942","display_name":null,"funder_award_id":"B0080529002330","funder_id":"https://openalex.org/F4320323185","funder_display_name":"Ministry of Innovation and Advanced Education"}],"funders":[{"id":"https://openalex.org/F4320323185","display_name":"Ministry of Innovation and Advanced Education","ror":"https://ror.org/00n0e2d34"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W62794737","https://openalex.org/W132147841","https://openalex.org/W2125027820","https://openalex.org/W2161168419","https://openalex.org/W2560609797","https://openalex.org/W2901435296","https://openalex.org/W2949924544","https://openalex.org/W2963121255","https://openalex.org/W2963177347","https://openalex.org/W2963188159","https://openalex.org/W2963756608","https://openalex.org/W2981378444","https://openalex.org/W2989915422","https://openalex.org/W3034986117","https://openalex.org/W3035355652","https://openalex.org/W3109585842","https://openalex.org/W3112108866","https://openalex.org/W3159481202","https://openalex.org/W3179923621","https://openalex.org/W3200754113","https://openalex.org/W4214755140","https://openalex.org/W4221167997","https://openalex.org/W4224598146","https://openalex.org/W4226321491","https://openalex.org/W4285186699","https://openalex.org/W4312364980","https://openalex.org/W4312670700","https://openalex.org/W4385318467","https://openalex.org/W4390874575","https://openalex.org/W4402667891","https://openalex.org/W4402917029","https://openalex.org/W4403123434","https://openalex.org/W4403826847","https://openalex.org/W4407247244","https://openalex.org/W4407566351","https://openalex.org/W4411270197","https://openalex.org/W4413847221","https://openalex.org/W4414165747","https://openalex.org/W4414229333"],"related_works":[],"abstract_inverted_index":{"The":[0,98,150],"estimation":[1,50],"of":[2,108],"6D":[3,209],"pose":[4,32,49,210],"from":[5,33,125],"RGB-D":[6,36],"data":[7,207],"remains":[8],"challenging":[9,68],"due":[10],"to":[11,26,119],"occlusions,":[12],"textureless":[13],"objects,":[14],"and":[15,81,184,192,197],"depth":[16,126],"noise.":[17,149],"In":[18],"this":[19,67],"work,":[20],"We":[21],"introduce":[22],"a":[23,34,132],"novel":[24],"architecture":[25,75],"calculate":[27],"precisely":[28],"the":[29,156,160],"6DoF":[30],"object":[31,142],"single":[35],"image.":[37],"Unlike":[38],"existing":[39],"structures":[40],"that":[41,138,169],"rely":[42],"on":[43,56,141,159],"direct":[44],"regression":[45],"&":[46],"convolution":[47],"based":[48,62,83,199],"as":[51,53],"well":[52],"heavily":[54],"depend":[55],"large":[57],"model":[58,120],"training,":[59],"our":[60,170],"vision":[61,78],"dual":[63],"stream":[64],"approach":[65,100,137],"addresses":[66],"task":[69],"using":[70,87],"hybrid":[71],"multi":[72],"modal":[73],"fusion":[74],"combining":[76],"self-supervised":[77],"transformers":[79],"(DINOv2)":[80],"attention":[82,117,198],"point":[84,127,134],"cloud":[85,135],"processing":[86,140],"C3G":[88],"(Compact":[89],"3D":[90,122],"Gaussian":[91],"representations":[92],"integrated":[93],"with":[94,187],"Point":[95,112],"Transformer":[96,113],"V3).":[97],"DINOv2":[99],"provides":[101],"robust":[102],"semantic":[103],"understanding":[104],"without":[105],"requiring":[106],"fine-tuning":[107],"visual":[109],"backbone,":[110],"while":[111,145,180],"V3":[114],"employs":[115],"vector":[116],"mechanisms":[118],"complex":[121],"geometric":[123,200],"patterns":[124],"clouds.":[128],"Moreover,":[129],"we":[130],"present":[131],"mask-guided":[133],"extraction":[136],"concentrates":[139],"relevant":[143],"regions":[144],"filtering":[146],"out":[147],"background":[148],"model\u2019s":[151],"efficacy":[152],"is":[153],"demonstrated":[154],"by":[155],"experimental":[157],"results":[158],"LineMOD-Occluded":[161],"dataset":[162],"over":[163],"RDPN":[164],"SOTA":[165],"benchmark,":[166],"which":[167],"show":[168],"network":[171],"requires":[172],"substantially":[173],"fewer":[174],"trainable":[175],"parameters":[176],"than":[177],"fully-supervised":[178],"alternatives":[179],"achieving":[181],"competitive":[182],"performance":[183],"notable":[185],"improvements":[186],"ADD(S)":[188],"metric,":[189],"rotation":[190],"error,":[191],"translation":[193],"error.":[194],"Self-supervised":[195],"learning":[196],"reasoning":[201],"together":[202],"provide":[203],"new":[204],"era":[205],"for":[206],"efficient":[208],"estimation.":[211]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-20T00:00:00"}
