{"id":"https://openalex.org/W4402401230","doi":"https://doi.org/10.1109/lsp.2024.3458792","title":"Improving Visual Representations of Masked Autoencoders With Artifacts Suppression","display_name":"Improving Visual Representations of Masked Autoencoders With Artifacts Suppression","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402401230","doi":"https://doi.org/10.1109/lsp.2024.3458792"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2024.3458792","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2024.3458792","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101601094","display_name":"Zhengwei Miao","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhengwei Miao","raw_affiliation_strings":["National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007665813","display_name":"Hui Luo","orcid":"https://orcid.org/0000-0001-6698-5576"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Luo","raw_affiliation_strings":["National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100386802","display_name":"Dongxu Liu","orcid":"https://orcid.org/0000-0003-0691-4025"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongxu Liu","raw_affiliation_strings":["National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100747273","display_name":"Jianlin Zhang","orcid":"https://orcid.org/0000-0002-5284-2942"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianlin Zhang","raw_affiliation_strings":["National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Optical Field Manipulation Science and Technology, Chinese Academy of Sciences, Chengdu, China","institution_ids":["https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101601094"],"corresponding_institution_ids":["https://openalex.org/I19820366"],"apc_list":null,"apc_paid":null,"fwci":0.4949,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.64575092,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"31","issue":null,"first_page":"2615","last_page":"2619"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9484999775886536,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9484999775886536,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6679074764251709},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6542832255363464},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5502991676330566},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.47947272658348083},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.40468457341194153}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6679074764251709},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6542832255363464},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5502991676330566},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.47947272658348083},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40468457341194153}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2024.3458792","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2024.3458792","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W2108598243","https://openalex.org/W2737258237","https://openalex.org/W2884822772","https://openalex.org/W3035524453","https://openalex.org/W3096831136","https://openalex.org/W3110939922","https://openalex.org/W3159481202","https://openalex.org/W4213366994","https://openalex.org/W4308503280","https://openalex.org/W4312446817","https://openalex.org/W4312804044","https://openalex.org/W4313156423","https://openalex.org/W4317496114","https://openalex.org/W4386065875","https://openalex.org/W4386066407","https://openalex.org/W4386221015","https://openalex.org/W4389104669","https://openalex.org/W4389105186","https://openalex.org/W4389371289","https://openalex.org/W4389664794","https://openalex.org/W6640963894","https://openalex.org/W6755207826","https://openalex.org/W6757817989","https://openalex.org/W6784333009","https://openalex.org/W6788135285","https://openalex.org/W6790978476","https://openalex.org/W6796761347","https://openalex.org/W6799515669","https://openalex.org/W6804160461","https://openalex.org/W6838657836","https://openalex.org/W6839263979","https://openalex.org/W6851800889","https://openalex.org/W6856857450"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Recently,":[0],"Masked":[1],"Autoencoders":[2],"(MAE)":[3],"have":[4],"gained":[5],"attention":[6,46,72],"for":[7],"their":[8],"abilities":[9],"to":[10,99,122,135],"generate":[11],"visual":[12,26],"representations":[13,27],"efficiently":[14],"through":[15],"pretext":[16],"tasks.":[17],"However,":[18],"there":[19],"has":[20],"been":[21],"little":[22],"research":[23],"evaluating":[24],"the":[25,33,41,45,52,56,71,82,94,100,103,144,149],"obtained":[28],"by":[29,43],"pre-trained":[30,53,63],"MAE":[31,54],"during":[32,55],"fine-tuning":[34,57,106,171],"process.":[35,58],"In":[36],"this":[37,90],"study,":[38],"we":[39,92,112,159],"address":[40,89],"gap":[42],"examining":[44],"maps":[47,73],"within":[48,129],"each":[49],"block":[50],"of":[51,74,86,96,151],"We":[59],"observed":[60,160],"artifacts":[61,78,98],"in":[62,70,164,170,178],"models,":[64],"which":[65],"appear":[66],"as":[67],"significant":[68],"responses":[69],"shallow":[75],"blocks.":[76],"These":[77],"may":[79],"negatively":[80],"impact":[81],"transfer":[83],"ability":[84],"performance":[85,150],"MAE.":[87],"To":[88,108],"issue,":[91],"localize":[93],"cause":[95],"these":[97,110],"asymmetry":[101],"between":[102],"pre-training":[104],"and":[105,125,174],"processes.":[107],"suppress":[109],"artifacts,":[111],"propose":[113],"a":[114,161,167,175],"novel":[115],"semantic":[116,127,179],"masking":[117,146],"strategy.":[118],"This":[119],"strategy":[120,147],"aims":[121],"preserve":[123],"complete":[124],"continuous":[126],"information":[128],"visible":[130],"patches":[131],"while":[132,155],"maintaining":[133],"randomness":[134],"facilitate":[136],"robust":[137],"representation":[138],"learning.":[139],"Experimental":[140],"results":[141],"demonstrate":[142],"that":[143],"proposed":[145],"improves":[148],"various":[152],"downstream":[153],"tasks":[154],"reducing":[156],"artifacts.":[157],"Specifically,":[158],"3.2%":[162],"improvement":[163],"linear":[165],"probing,":[166],"0.5%":[168],"enhancement":[169],"on":[172,181],"Imagenet1K,":[173],"0.6%":[176],"increase":[177],"segmentation":[180],"ADE20K.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
