{"id":"https://openalex.org/W4412082058","doi":"https://doi.org/10.26599/cvm.2025.9450474","title":"FastMAE: Efficient Masked Autoencoder with Offline Tokenizer","display_name":"FastMAE: Efficient Masked Autoencoder with Offline Tokenizer","publication_year":2025,"publication_date":"2025-06-01","ids":{"openalex":"https://openalex.org/W4412082058","doi":"https://doi.org/10.26599/cvm.2025.9450474"},"language":"en","primary_location":{"id":"doi:10.26599/cvm.2025.9450474","is_oa":true,"landing_page_url":"https://doi.org/10.26599/cvm.2025.9450474","pdf_url":null,"source":{"id":"https://openalex.org/S2487656537","display_name":"Computational Visual Media","issn_l":"2096-0433","issn":["2096-0433","2096-0662"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Visual Media","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.26599/cvm.2025.9450474","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101135616","display_name":"Meng-Hao Guo","orcid":"https://orcid.org/0000-0002-4128-4594"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Meng-Hao Guo","raw_affiliation_strings":["Tsinghua University,Department of Computer Science,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Department of Computer Science,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100337628","display_name":"Chen Wang","orcid":"https://orcid.org/0000-0002-9315-3780"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chen Wang","raw_affiliation_strings":["University of Pennsylvania,Philadelphia,PA,USA,19104"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania,Philadelphia,PA,USA,19104","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431792","display_name":"Wei Liu","orcid":"https://orcid.org/0000-0002-3865-8145"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["Tencent Data Platform,Shenzhen,China,518057"],"affiliations":[{"raw_affiliation_string":"Tencent Data Platform,Shenzhen,China,518057","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083982090","display_name":"Shimin Hu","orcid":"https://orcid.org/0000-0002-3284-2494"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shi-Min Hu","raw_affiliation_strings":["Tsinghua University,Department of Computer Science,Beijing,China,100084"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Department of Computer Science,Beijing,China,100084","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101135616"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17952393,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11","issue":"3","first_page":"483","last_page":"496"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9815999865531921,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9603000283241272,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.8600298166275024},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5729122757911682},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2774171829223633},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.09819775819778442}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.8600298166275024},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5729122757911682},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2774171829223633},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.09819775819778442}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.26599/cvm.2025.9450474","is_oa":true,"landing_page_url":"https://doi.org/10.26599/cvm.2025.9450474","pdf_url":null,"source":{"id":"https://openalex.org/S2487656537","display_name":"Computational Visual Media","issn_l":"2096-0433","issn":["2096-0433","2096-0662"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Visual Media","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:82f5f2e504224905a8024244e5d77be1","is_oa":true,"landing_page_url":"https://doaj.org/article/82f5f2e504224905a8024244e5d77be1","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computational Visual Media, Vol 11, Iss 3, Pp 483-496 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.26599/cvm.2025.9450474","is_oa":true,"landing_page_url":"https://doi.org/10.26599/cvm.2025.9450474","pdf_url":null,"source":{"id":"https://openalex.org/S2487656537","display_name":"Computational Visual Media","issn_l":"2096-0433","issn":["2096-0433","2096-0662"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Visual Media","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5981067533","display_name":null,"funder_award_id":"623B2057,62220106003","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2108598243","https://openalex.org/W2737258237","https://openalex.org/W2798991696","https://openalex.org/W2884822772","https://openalex.org/W2963150697","https://openalex.org/W3035524453","https://openalex.org/W3096609285","https://openalex.org/W3100341797","https://openalex.org/W3108655343","https://openalex.org/W3111535274","https://openalex.org/W3121523901","https://openalex.org/W3129576130","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3159481202","https://openalex.org/W3172615411","https://openalex.org/W3175515048","https://openalex.org/W4302275239","https://openalex.org/W4312262772","https://openalex.org/W4312309398","https://openalex.org/W4312312750","https://openalex.org/W4312349930","https://openalex.org/W4312560592","https://openalex.org/W4312804044","https://openalex.org/W4313156423","https://openalex.org/W4313158203","https://openalex.org/W4322207844","https://openalex.org/W4382465386","https://openalex.org/W4385346076","https://openalex.org/W4386076084","https://openalex.org/W4386076174","https://openalex.org/W4386076385","https://openalex.org/W4386076522","https://openalex.org/W4386083047","https://openalex.org/W4386221015","https://openalex.org/W4389104669","https://openalex.org/W4401609774","https://openalex.org/W4401931559","https://openalex.org/W4401953181"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W3013693939","https://openalex.org/W2566616303","https://openalex.org/W2159052453","https://openalex.org/W3131327266","https://openalex.org/W2734887215","https://openalex.org/W2803255133","https://openalex.org/W4297051394"],"abstract_inverted_index":{"Masked":[0],"autoencoders":[1],"(MAEs)":[2],"have":[3],"recently":[4],"achieved":[5],"great":[6],"success":[7],"in":[8,45,77,97,123,169],"computer":[9,147],"vision.":[10],"They":[11],"can":[12,93,117,175],"automatically":[13],"extract":[14],"representations":[15],"from":[16,102],"unlabeled":[17],"data":[18],"and":[19,172],"improve":[20],"the":[21,48,55,72,103,137,146],"performance":[22,155],"of":[23,57,74],"various":[24],"downstream":[25],"tasks.":[26],"However,":[27],"training":[28],"an":[29,66,88,98,108],"MAE":[30,68],"model":[31],"requires":[32],"substantial":[33],"resources,":[34],"which":[35,92,132],"limits":[36],"their":[37],"accessibility":[38],"to":[39,86,156,167],"many":[40],"academic":[41],"institutions:":[42],"often":[43],"laboratories":[44],"universities":[46],"lack":[47],"necessary":[49],"resources.":[50],"This":[51],"issue":[52],"significantly":[53],"hinders":[54],"development":[56,178],"this":[58,61],"field.":[59],"In":[60],"paper,":[62],"we":[63,174],"propose":[64],"FastMAE,":[65],"efficient":[67,99,109],"approach.":[69],"Inspired":[70],"by":[71],"idea":[73],"offline":[75,89,104],"tokenizers":[76],"natural":[78],"language":[79],"processing,":[80],"FastMAE":[81,106,116],"presents":[82],"a":[83,141],"novel":[84],"way":[85],"build":[87],"vision":[90,110,148],"tokenizer,":[91,105],"provide":[94],"high-level":[95],"semantics":[96],"way.":[100],"Benefiting":[101],"becomes":[107],"learner.":[111],"Our":[112],"experiments":[113],"demonstrate":[114],"that":[115,173],"achieve":[118],"83.6%":[119],"accuracy":[120],"with":[121],"ViT-B":[122],"only":[124],"18.8":[125],"h":[126],"on":[127],"8":[128],"NVIDIA":[129],"Tesla-V100":[130],"GPUs,":[131],"is":[133],"31.3\u00d7":[134],"faster":[135],"than":[136],"original":[138],"MAE,":[139],"providing":[140],"resource":[142],"friendly":[143],"baseline":[144],"for":[145],"community.":[149],"Moreover,":[150],"it":[151],"also":[152],"achieves":[153],"comparable":[154],"state-of-the-art":[157],"methods.":[158],"We":[159],"hope":[160],"our":[161],"research":[162,171],"will":[163],"attract":[164],"more":[165],"people":[166],"engage":[168],"MAE-related":[170],"advance":[176],"its":[177],"together.":[179]},"counts_by_year":[],"updated_date":"2026-02-27T16:54:17.756197","created_date":"2025-10-10T00:00:00"}
