{"id":"https://openalex.org/W4387587760","doi":"https://doi.org/10.1109/lsp.2023.3324245","title":"Rotated and Masked Image Modeling: A Superior Self-Supervised Method for Classification","display_name":"Rotated and Masked Image Modeling: A Superior Self-Supervised Method for Classification","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4387587760","doi":"https://doi.org/10.1109/lsp.2023.3324245"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2023.3324245","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3324245","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053349006","display_name":"Daisong Yan","orcid":"https://orcid.org/0009-0005-1563-5097"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Daisong Yan","raw_affiliation_strings":["School of Computing and Artificial Intelligence, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computing and Artificial Intelligence, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078493980","display_name":"Xun Gong","orcid":"https://orcid.org/0000-0002-1494-0955"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xun Gong","raw_affiliation_strings":["School of Computing and Artificial Intelligence, Southwest Jiaotong University, Engineering Research Center of Sustainable Urban Intelligent Transportation, Ministry of Education China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computing and Artificial Intelligence, Southwest Jiaotong University, Engineering Research Center of Sustainable Urban Intelligent Transportation, Ministry of Education China, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101463477","display_name":"Zhemin Zhang","orcid":"https://orcid.org/0000-0002-1150-1316"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhemin Zhang","raw_affiliation_strings":["School of Computing and Artificial Intelligence, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computing and Artificial Intelligence, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5053349006"],"corresponding_institution_ids":["https://openalex.org/I4800084"],"apc_list":null,"apc_paid":null,"fwci":0.3685,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.60584251,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"30","issue":null,"first_page":"1477","last_page":"1481"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12549","display_name":"Image and Object Detection Techniques","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7867703437805176},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6293942928314209},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5444797277450562},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5063866376876831},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.4232410490512848},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41042372584342957},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1579262614250183}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7867703437805176},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6293942928314209},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5444797277450562},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5063866376876831},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.4232410490512848},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41042372584342957},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1579262614250183},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2023.3324245","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3324245","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2492887464","display_name":null,"funder_award_id":"62376231","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W2097117768","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2618530766","https://openalex.org/W2765407302","https://openalex.org/W2992308087","https://openalex.org/W3005680577","https://openalex.org/W3009561768","https://openalex.org/W3094502228","https://openalex.org/W3121523901","https://openalex.org/W3131500599","https://openalex.org/W3133696297","https://openalex.org/W3138516171","https://openalex.org/W3145450063","https://openalex.org/W3156811085","https://openalex.org/W3157528469","https://openalex.org/W3176153963","https://openalex.org/W4214614183","https://openalex.org/W4221167396","https://openalex.org/W4226167593","https://openalex.org/W4312604822","https://openalex.org/W4312804044","https://openalex.org/W4313156423","https://openalex.org/W6745136726","https://openalex.org/W6774314701","https://openalex.org/W6774670964","https://openalex.org/W6784333009","https://openalex.org/W6790690058","https://openalex.org/W6794345597","https://openalex.org/W6794906783","https://openalex.org/W6798016242","https://openalex.org/W6810265253","https://openalex.org/W6810655313"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4313488044","https://openalex.org/W3107602296","https://openalex.org/W3209574120","https://openalex.org/W4312192474","https://openalex.org/W2033914206"],"abstract_inverted_index":{"Mask":[0],"image":[1,21,132],"modeling":[2],"(MIM)":[3],"has":[4,74,133],"performed":[5],"excellently":[6],"as":[7],"a":[8,61,75,97,107],"transformer-based":[9],"self-supervised":[10,63,99,150],"method":[11,65,110],"via":[12],"random":[13],"masking":[14],"and":[15,35,95,158],"reconstruction.":[16],"However,":[17],"since":[18],"the":[19,26,33,43,47,80,87,117,134],"unmasked":[20,88],"patches":[22],"are":[23],"non-participation":[24],"in":[25,130],"loss":[27],"computation,":[28],"MIM":[29],"cannot":[30],"effectively":[31],"utilize":[32,93],"data":[34,94,108],"waste":[36],"much":[37],"computation.":[38],"This":[39,137],"drawback":[40],"usually":[41],"limits":[42],"learning":[44,64],"ability":[45],"of":[46,127],"pre-training":[48,51],"model":[49],"when":[50],"on":[52,152],"small-scale":[53,67],"datasets.":[54],"To":[55],"solve":[56],"this":[57],"problem,":[58],"we":[59,105],"propose":[60,106],"novel":[62],"for":[66],"datasets":[68],"called":[69,111],"RotMIM.":[70],"Unlike":[71],"MIM,":[72],"RotMIM":[73,90,121],"different":[76],"pretext":[77],"task:":[78],"recognizing":[79],"rotation":[81],"angle":[82],"that":[83,116,123],"is":[84],"applied":[85],"to":[86,102],"patches.":[89],"can":[91],"fully":[92],"provide":[96],"stronger":[98],"signal.":[100],"Moreover,":[101],"fit":[103],"RotMIM,":[104],"augmentation":[109],"FeaMix.":[112],"Our":[113,146],"proposal":[114],"ensures":[115],"mixing":[118],"area":[119],"with":[120],"understands":[122],"each":[124],"basic":[125],"unit":[126],"semantic":[128],"information":[129],"an":[131],"same":[135],"size.":[136],"consistency":[138],"guarantees":[139],"clean":[140],"tokenization":[141],"during":[142],"fine-tuning":[143],"after":[144],"pre-training.":[145],"proposals":[147],"outperform":[148],"state-of-the-art":[149],"methods":[151],"three":[153],"popular":[154],"datasets,":[155],"Mini-ImageNet,":[156],"Caltech256,":[157],"Cifar100.":[159]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
