{"id":"https://openalex.org/W4387968122","doi":"https://doi.org/10.1145/3581783.3612104","title":"M3R: Masked Token Mixup and Cross-Modal Reconstruction for Zero-Shot Learning","display_name":"M3R: Masked Token Mixup and Cross-Modal Reconstruction for Zero-Shot Learning","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4387968122","doi":"https://doi.org/10.1145/3581783.3612104"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3612104","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101645107","display_name":"Peng Zhao","orcid":"https://orcid.org/0000-0002-2666-0299"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Peng Zhao","raw_affiliation_strings":["Shandong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103211526","display_name":"Qiangchang Wang","orcid":"https://orcid.org/0000-0003-0416-8778"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiangchang Wang","raw_affiliation_strings":["Shandong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100672590","display_name":"Yilong Yin","orcid":"https://orcid.org/0000-0002-8465-1294"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yilong Yin","raw_affiliation_strings":["Shandong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101645107"],"corresponding_institution_ids":["https://openalex.org/I154099455"],"apc_list":null,"apc_paid":null,"fwci":1.037,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.8170995,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"3161","last_page":"3171"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9757999777793884,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.9739999771118164,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.687336802482605},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.638128399848938},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5537247061729431},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4929814338684082},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.4636439383029938},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.46207550168037415},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.45456650853157043},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4293714165687561},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39496734738349915}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.687336802482605},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.638128399848938},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5537247061729431},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4929814338684082},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.4636439383029938},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.46207550168037415},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.45456650853157043},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4293714165687561},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39496734738349915},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581783.3612104","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7400000095367432}],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2486014166","display_name":null,"funder_award_id":"ZR2021ZD15","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4076825138","display_name":null,"funder_award_id":"62176139","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5581446023","display_name":null,"funder_award_id":"62176139","funder_id":"https://openalex.org/F4320311026","funder_display_name":"Shandong University"},{"id":"https://openalex.org/G5977364686","display_name":null,"funder_award_id":"2022YFC3302802","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7872253039","display_name":null,"funder_award_id":"ZR2021ZD15","funder_id":"https://openalex.org/F4320311026","funder_display_name":"Shandong University"},{"id":"https://openalex.org/G8764071032","display_name":null,"funder_award_id":"2022YFC","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G8955107213","display_name":null,"funder_award_id":"Major","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320311026","display_name":"Shandong University","ror":"https://ror.org/0207yh398"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1797268635","https://openalex.org/W2070148066","https://openalex.org/W2128532956","https://openalex.org/W2141350700","https://openalex.org/W2533598788","https://openalex.org/W2924476266","https://openalex.org/W2962716320","https://openalex.org/W2963960318","https://openalex.org/W2982234480","https://openalex.org/W2991813857","https://openalex.org/W3035655772","https://openalex.org/W3096741441","https://openalex.org/W3098404559","https://openalex.org/W3171926364","https://openalex.org/W3182605419","https://openalex.org/W3204333469","https://openalex.org/W4200633401","https://openalex.org/W4210605815","https://openalex.org/W4221152131","https://openalex.org/W4226458340","https://openalex.org/W4226487100","https://openalex.org/W4226519649","https://openalex.org/W4295917908","https://openalex.org/W4296413741","https://openalex.org/W4304083988","https://openalex.org/W4304084141","https://openalex.org/W4308503280","https://openalex.org/W4312747676","https://openalex.org/W4312762894","https://openalex.org/W4382318469","https://openalex.org/W6600459194","https://openalex.org/W6745136726","https://openalex.org/W6781630272","https://openalex.org/W6804160461"],"related_works":["https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W2761785940","https://openalex.org/W1482209366","https://openalex.org/W2110523656","https://openalex.org/W2521627374","https://openalex.org/W2981954115"],"abstract_inverted_index":{"In":[0,23],"the":[1,16,44,77,86,98,114,140,153,176,189,235],"zero-shot":[2,35],"learning":[3],"(ZSL),":[4],"learned":[5],"representation":[6,99,122],"spaces":[7],"are":[8],"often":[9],"biased":[10],"toward":[11,46,79,178],"seen":[12,47,80,146,167,179],"classes,":[13,164],"thus":[14],"limiting":[15],"ability":[17],"to":[18,72,90,101,125,157,173,211],"predict":[19],"previously":[20],"unseen":[21,73,93,135,163,170],"classes.":[22,48,81,104,171],"this":[24,84,151],"paper,":[25],"we":[26],"propose":[27],"Masked":[28],"token":[29],"Mixup":[30,56],"and":[31,62,120,181,186,203,219,226,231,237],"cross-Modal":[32],"Reconstruction":[33,65],"for":[34,162],"learning,":[36],"termed":[37],"as":[38],"M3R,":[39],"which":[40,193],"can":[41,194,208],"significantly":[42],"alleviate":[43],"bias":[45,78,177],"The":[49],"M3R":[50,242],"mainly":[51],"consists":[52],"of":[53,216,239],"Random":[54],"Token":[55],"(RTM),":[57],"Unseen":[58],"Class":[59],"Detection":[60],"(UCD),":[61],"Hard":[63],"Cross-modal":[64],"(HCR).":[66],"Firstly,":[67],"mappings":[68],"without":[69],"proper":[70],"adaptations":[71],"classes":[74,168,180],"would":[75],"cause":[76],"To":[82,149],"address":[83],"issue,":[85],"RTM":[87,141],"is":[88,106,155,191],"introduced":[89],"generate":[91,158],"diverse":[92],"class":[94,136,147],"agents,":[95],"thereby":[96,165],"broadening":[97],"space":[100,123],"cover":[102,126],"unknown":[103],"It":[105],"applied":[107],"at":[108],"a":[109,213],"randomly":[110],"selected":[111],"layer":[112],"in":[113],"Vision":[115],"Transformer,":[116],"producing":[117],"smooth":[118],"low-":[119],"high-level":[121],"boundaries":[124],"rich":[127],"attributes.":[128],"Secondly,":[129],"it":[130],"should":[131],"be":[132,143],"noted":[133],"that":[134],"agents":[137],"generated":[138],"by":[139],"may":[142],"mixed":[144],"with":[145],"samples.":[148],"overcome":[150],"challenge,":[152],"UCD":[154],"designed":[156],"greater":[159],"entropy":[160],"values":[161],"distinguishing":[166],"from":[169],"Thirdly,":[172],"further":[174],"mitigate":[175],"explore":[182],"associations":[183],"between":[184,223],"semantics":[185],"visual":[187,227],"images,":[188],"HCR":[190],"proposed,":[192],"reconstruct":[195],"masked":[196],"pixels":[197],"based":[198],"on":[199],"few":[200],"discriminative":[201],"tokens":[202],"attribute":[204],"embeddings.":[205],"This":[206],"approach":[207],"enable":[209],"models":[210],"have":[212],"deep":[214],"understanding":[215],"image":[217],"contents":[218],"build":[220],"powerful":[221],"connections":[222],"semantic":[224],"attributes":[225],"information.":[228],"Both":[229],"qualitative":[230],"quantitative":[232],"results":[233],"demonstrate":[234],"effectiveness":[236],"usefulness":[238],"our":[240],"proposed":[241],"model.":[243]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
