{"id":"https://openalex.org/W4417104505","doi":"https://doi.org/10.1109/lra.2026.3673898","title":"Rethinking Transparent Object Grasping: Depth Completion With Monocular Depth Estimation and Instance Mask","display_name":"Rethinking Transparent Object Grasping: Depth Completion With Monocular Depth Estimation and Instance Mask","publication_year":2026,"publication_date":"2026-03-13","ids":{"openalex":"https://openalex.org/W4417104505","doi":"https://doi.org/10.1109/lra.2026.3673898"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2026.3673898","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2026.3673898","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2508.02507","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027056395","display_name":"Yaofeng Cheng","orcid":"https://orcid.org/0000-0001-8126-7302"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yaofeng Cheng","raw_affiliation_strings":["State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042358251","display_name":"X. Gao","orcid":"https://orcid.org/0000-0001-7205-2318"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinkai Gao","raw_affiliation_strings":["State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100378893","display_name":"Sen Zhang","orcid":"https://orcid.org/0000-0002-8010-6045"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sen Zhang","raw_affiliation_strings":["State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114012512","display_name":"Chengang Zeng","orcid":null},"institutions":[{"id":"https://openalex.org/I146655781","display_name":"University of Liverpool","ror":"https://ror.org/04xs57h96","country_code":"GB","type":"education","lineage":["https://openalex.org/I146655781"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chao Zeng","raw_affiliation_strings":["Department of Computer Science, University of Liverpool, Liverpool, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Liverpool, Liverpool, U.K","institution_ids":["https://openalex.org/I146655781"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008850130","display_name":"Fusheng Zha","orcid":"https://orcid.org/0000-0001-9695-1940"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fusheng Zha","raw_affiliation_strings":["State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037670975","display_name":"Lin Sun","orcid":"https://orcid.org/0000-0002-8781-2057"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lining Sun","raw_affiliation_strings":["State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and System at Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019906827","display_name":"Chenguang Yang","orcid":"https://orcid.org/0000-0001-5255-5559"},"institutions":[{"id":"https://openalex.org/I146655781","display_name":"University of Liverpool","ror":"https://ror.org/04xs57h96","country_code":"GB","type":"education","lineage":["https://openalex.org/I146655781"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chenguang Yang","raw_affiliation_strings":["Department of Computer Science, University of Liverpool, Liverpool, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Liverpool, Liverpool, U.K","institution_ids":["https://openalex.org/I146655781"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5027056395"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00514731,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11","issue":"5","first_page":"5510","last_page":"5517"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6021000146865845,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6021000146865845,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.29989999532699585,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.040800001472234726,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.842199981212616},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7493000030517578},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5756999850273132},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5738000273704529},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5694000124931335},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5457000136375427},{"id":"https://openalex.org/keywords/depth-map","display_name":"Depth map","score":0.4415000081062317},{"id":"https://openalex.org/keywords/depth-perception","display_name":"Depth perception","score":0.3970000147819519},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.38260000944137573}],"concepts":[{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.842199981212616},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7493000030517578},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7071999907493591},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7032999992370605},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.592199981212616},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5756999850273132},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5738000273704529},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5694000124931335},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5457000136375427},{"id":"https://openalex.org/C141268832","wikidata":"https://www.wikidata.org/wiki/Q2940499","display_name":"Depth map","level":3,"score":0.4415000081062317},{"id":"https://openalex.org/C52672216","wikidata":"https://www.wikidata.org/wiki/Q1749840","display_name":"Depth perception","level":3,"score":0.3970000147819519},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.38260000944137573},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.35040000081062317},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3395000100135803},{"id":"https://openalex.org/C113346285","wikidata":"https://www.wikidata.org/wiki/Q6804193","display_name":"Measured depth","level":2,"score":0.32850000262260437},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.3240000009536743},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.31200000643730164},{"id":"https://openalex.org/C158829959","wikidata":"https://www.wikidata.org/wiki/Q1640606","display_name":"Monocular vision","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.30149999260902405},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.2540999948978424},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/lra.2026.3673898","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2026.3673898","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2508.02507","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.02507","pdf_url":"https://arxiv.org/pdf/2508.02507","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2508.02507","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.02507","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2508.02507","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.02507","pdf_url":"https://arxiv.org/pdf/2508.02507","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Accurate":[0],"depth":[1,13,20,32,46,52,89,99,153,161,166],"maps":[2],"are":[3,207],"essential":[4],"for":[5,34],"robotic":[6],"grasping.":[7],"However,":[8,51],"transparent":[9,35,87,112,132,169,179],"objects":[10,36,170],"often":[11,71],"cause":[12],"cameras":[14],"to":[15,22,44,64,73,96,109,131,137,174],"produce":[16],"missing":[17],"or":[18],"distorted":[19],"due":[21],"reflection":[23],"and":[24,59,124,134,171,187,205],"refraction,":[25],"making":[26,61],"grasping":[27],"them":[28],"particularly":[29],"challenging.":[30],"Precise":[31],"estimation":[33,100],"is":[37],"therefore":[38],"crucial.":[39],"Existing":[40],"end-to-end":[41],"methods":[42],"aim":[43],"predict":[45],"directly":[47],"from":[48,114,159],"RGB-D":[49],"inputs.":[50],"distortion":[53],"varies":[54],"significantly":[55,193],"with":[56],"environment,":[57],"viewpoint,":[58],"illumination,":[60],"it":[62],"difficult":[63],"predict.":[65],"Models":[66],"trained":[67],"on":[68],"limited":[69],"datasets":[70,186],"fail":[72],"generalize":[74],"effectively":[75],"in":[76,145,198],"real-world":[77,125,146,188],"applications.":[78,147],"In":[79],"this":[80],"letter,":[81],"we":[82,104,149],"propose":[83],"ReMake,":[84],"a":[85,106],"novel":[86],"object":[88],"completion":[90],"framework":[91],"that":[92,191],"injects":[93],"structured":[94],"priors":[95],"reformulate":[97],"the":[98,142,165,176],"learning":[101],"objective.":[102],"First,":[103],"introduce":[105],"mask":[107],"prior":[108,157],"explicitly":[110],"separate":[111],"regions":[113,133,180],"reliable":[115],"background":[116,173],"depth.":[117],"This":[118,140],"separation":[119],"ensures":[120],"consistency":[121],"between":[122,168],"training":[123],"application,":[126],"where":[127],"masked":[128],"areas":[129,136],"correspond":[130],"unmasked":[135],"opaque":[138],"ones.":[139],"improves":[141],"model's":[143],"generalizability":[144],"Second,":[148],"further":[150],"incorporate":[151],"relative":[152],"as":[154],"an":[155],"additional":[156],"obtained":[158],"monocular":[160],"estimation,":[162],"which":[163],"encodes":[164],"relationship":[167],"their":[172],"guide":[175],"reconstruction":[177],"of":[178],"more":[181],"effectively.":[182],"Extensive":[183],"experiments":[184],"across":[185],"scenes":[189],"demonstrate":[190],"ReMake":[192],"outperforms":[194],"existing":[195],"methods,":[196],"especially":[197],"different-view":[199],"prediction":[200],"experiments,":[201],"evaluating":[202],"its":[203],"generalizabilityCode":[204],"videos":[206],"available":[208],"at":[209],"<uri":[210],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[211],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://chengyaofeng.github.io/ReMake.github.io/</uri>.":[212]},"counts_by_year":[],"updated_date":"2026-04-01T17:29:45.350535","created_date":"2025-10-10T00:00:00"}
