{"id":"https://openalex.org/W4402979570","doi":"https://doi.org/10.1109/icme57554.2024.10688068","title":"LR-MAE: Locate while Reconstructing with Masked Autoencoders for Point Cloud Self-supervised Learning","display_name":"LR-MAE: Locate while Reconstructing with Masked Autoencoders for Point Cloud Self-supervised Learning","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4402979570","doi":"https://doi.org/10.1109/icme57554.2024.10688068"},"language":"en","primary_location":{"id":"doi:10.1109/icme57554.2024.10688068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme57554.2024.10688068","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102635050","display_name":"Huizhen Ji","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Huizhen Ji","raw_affiliation_strings":["Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035486153","display_name":"Yaohua Zha","orcid":"https://orcid.org/0000-0001-9789-452X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaohua Zha","raw_affiliation_strings":["Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111663001","display_name":"Qingmin Liao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingmin Liao","raw_affiliation_strings":["Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102635050"],"corresponding_institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.2225,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.49214349,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11164","display_name":"Remote Sensing and LiDAR Applications","score":0.9667999744415283,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11164","display_name":"Remote Sensing and LiDAR Applications","score":0.9667999744415283,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.965399980545044,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9599000215530396,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.7741985321044922},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7292854189872742},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6395003795623779},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.61871337890625},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4164116680622101},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41123417019844055},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09270116686820984}],"concepts":[{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.7741985321044922},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7292854189872742},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6395003795623779},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.61871337890625},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4164116680622101},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41123417019844055},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09270116686820984},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme57554.2024.10688068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme57554.2024.10688068","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W2229637417","https://openalex.org/W2889895098","https://openalex.org/W2904332125","https://openalex.org/W2988715931","https://openalex.org/W3096609285","https://openalex.org/W3116959466","https://openalex.org/W3165924482","https://openalex.org/W3184000328","https://openalex.org/W4214526701","https://openalex.org/W4214624153","https://openalex.org/W4312270234","https://openalex.org/W4312788538","https://openalex.org/W4312980726","https://openalex.org/W4313156423","https://openalex.org/W4372259856","https://openalex.org/W4372260592","https://openalex.org/W4385245566","https://openalex.org/W4386071873","https://openalex.org/W4390874204","https://openalex.org/W4393147949","https://openalex.org/W6739778489","https://openalex.org/W6755207826","https://openalex.org/W6763422710","https://openalex.org/W6784094891","https://openalex.org/W6810249204","https://openalex.org/W6839294089","https://openalex.org/W6839446344","https://openalex.org/W6841095953","https://openalex.org/W6847873191","https://openalex.org/W6849622024"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"As":[0],"an":[1],"efficient":[2],"self-supervised":[3,61],"pre-training":[4,117],"approach,":[5],"Masked":[6,68],"autoencoder":[7],"(MAE)":[8],"has":[9],"shown":[10],"promising":[11],"improvement":[12],"across":[13],"various":[14,139],"3D":[15,111],"point":[16,140],"cloud":[17,141],"understanding":[18,142],"tasks.":[19,52,100,143],"However,":[20],"the":[21,31,80,116,122,151,159,165,174],"pretext":[22],"task":[23],"of":[24,33,83],"existing":[25],"point-based":[26],"MAE":[27],"is":[28,46,75,178],"to":[29,77],"reconstruct":[30],"geometry":[32],"masked":[34,84,88],"points":[35],"only,":[36],"hence":[37],"it":[38],"learns":[39],"features":[40,95],"at":[41,91,180],"lower":[42],"semantic":[43,94],"levels":[44],"which":[45,119],"not":[47],"appropriate":[48],"for":[49,110],"high-level":[50],"downstream":[51,99,147],"To":[53],"address":[54],"this":[55],"challenge,":[56],"we":[57,102],"propose":[58],"a":[59,72,104],"novel":[60],"approach":[62],"named":[63],"Locate":[64],"while":[65,86],"Reconstructing":[66],"with":[67,98,125],"Autoencoders":[69],"(LR-MAE).":[70],"Specifically,":[71],"multi-head":[73],"decoder":[74],"designed":[76],"simultaneously":[78],"localize":[79],"global":[81],"position":[82],"patches":[85],"reconstructing":[87],"points,":[89],"aimed":[90],"learning":[92],"better":[93],"that":[96,132],"align":[97],"Moreover,":[101],"design":[103],"random":[105],"query":[106],"patch":[107],"detection":[108,113],"strategy":[109],"object":[112],"tasks":[114],"in":[115],"stage,":[118],"significantly":[120,163],"boosts":[121],"model":[123],"performance":[124,137],"faster":[126],"convergence":[127],"speed.":[128],"Extensive":[129],"experiments":[130],"show":[131],"our":[133],"LR-MAE":[134,149],"achieves":[135],"superior":[136],"on":[138,146,158,173],"By":[144],"fine-tuning":[145],"datasets,":[148],"outperforms":[150],"Point-MAE":[152],"baseline":[153,167],"by":[154,168],"3.65%":[155],"classification":[156],"accuracy":[157],"ScanObjectNN":[160],"dataset,":[161],"and":[162],"exceeds":[164],"3DETR":[166],"6.1%":[169],"AP<inf":[170],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[171],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">50</inf>":[172],"ScanNetV2":[175],"dataset.":[176],"Code":[177],"available":[179],"https://github.com/cathy-ji/LR-MAE.":[181]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
