{"id":"https://openalex.org/W4393033964","doi":"https://doi.org/10.1109/tmm.2024.3379896","title":"Fine-Tuning for Few-Shot Image Classification by Multimodal Prototype Regularization","display_name":"Fine-Tuning for Few-Shot Image Classification by Multimodal Prototype Regularization","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4393033964","doi":"https://doi.org/10.1109/tmm.2024.3379896"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2024.3379896","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3379896","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033853764","display_name":"Qianhao Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qianhao Wu","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-6939-4357","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016137773","display_name":"Jiaxin Qi","orcid":"https://orcid.org/0009-0000-7127-7400"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jiaxin Qi","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0009-0000-7127-7400","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101818657","display_name":"Dong Zhang","orcid":"https://orcid.org/0000-0002-4543-2179"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Zhang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-4543-2179","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042324027","display_name":"Hanwang Zhang","orcid":"https://orcid.org/0000-0001-7374-8739"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Hanwang Zhang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-7374-8739","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035112538","display_name":"Jinhui Tang","orcid":"https://orcid.org/0000-0001-9008-222X"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinhui Tang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-9008-222X","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5033853764"],"corresponding_institution_ids":["https://openalex.org/I36399199"],"apc_list":null,"apc_paid":null,"fwci":2.9802,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.91791888,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"26","issue":null,"first_page":"8543","last_page":"8556"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.978600025177002,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8355427980422974},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.697036623954773},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6869837641716003},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5531946420669556},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.5259578227996826},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.48828768730163574},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4738098680973053},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3231702148914337},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3010174334049225}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8355427980422974},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.697036623954773},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6869837641716003},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5531946420669556},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.5259578227996826},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.48828768730163574},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4738098680973053},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3231702148914337},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3010174334049225},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2024.3379896","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3379896","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4307386619","display_name":null,"funder_award_id":"AISG2-RP-2021-022","funder_id":"https://openalex.org/F4320320709","funder_display_name":"National Research Foundation Singapore"}],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":84,"referenced_works":["https://openalex.org/W12634471","https://openalex.org/W1614298861","https://openalex.org/W1677182931","https://openalex.org/W1846799578","https://openalex.org/W1977295328","https://openalex.org/W2017814585","https://openalex.org/W2047643928","https://openalex.org/W2051669046","https://openalex.org/W2100031962","https://openalex.org/W2108598243","https://openalex.org/W2122528955","https://openalex.org/W2138011018","https://openalex.org/W2145215286","https://openalex.org/W2166049352","https://openalex.org/W2194775991","https://openalex.org/W2519882289","https://openalex.org/W2533598788","https://openalex.org/W2562153041","https://openalex.org/W2866912866","https://openalex.org/W2962714319","https://openalex.org/W2963785020","https://openalex.org/W2964194231","https://openalex.org/W2965572487","https://openalex.org/W2980113592","https://openalex.org/W3024314529","https://openalex.org/W3034827765","https://openalex.org/W3094219444","https://openalex.org/W3108975329","https://openalex.org/W3110057998","https://openalex.org/W3128632573","https://openalex.org/W3182683290","https://openalex.org/W3198377975","https://openalex.org/W3215626407","https://openalex.org/W4213448312","https://openalex.org/W4226058394","https://openalex.org/W4280538209","https://openalex.org/W4294170691","https://openalex.org/W4297697565","https://openalex.org/W4304098253","https://openalex.org/W4312310776","https://openalex.org/W4312601888","https://openalex.org/W4312629998","https://openalex.org/W4312651322","https://openalex.org/W4313175608","https://openalex.org/W4313477435","https://openalex.org/W4320492418","https://openalex.org/W4382240281","https://openalex.org/W4382468457","https://openalex.org/W4385245566","https://openalex.org/W4386065763","https://openalex.org/W4386072096","https://openalex.org/W4386075788","https://openalex.org/W4386075975","https://openalex.org/W4386076609","https://openalex.org/W4386076681","https://openalex.org/W4386790226","https://openalex.org/W4388976132","https://openalex.org/W4390873714","https://openalex.org/W4391244552","https://openalex.org/W6636510571","https://openalex.org/W6638677478","https://openalex.org/W6678360021","https://openalex.org/W6678470764","https://openalex.org/W6686418764","https://openalex.org/W6717697761","https://openalex.org/W6726497184","https://openalex.org/W6736057607","https://openalex.org/W6743661861","https://openalex.org/W6753311412","https://openalex.org/W6757817989","https://openalex.org/W6758126075","https://openalex.org/W6766978945","https://openalex.org/W6790019176","https://openalex.org/W6791353385","https://openalex.org/W6798805250","https://openalex.org/W6800139874","https://openalex.org/W6801488762","https://openalex.org/W6803872405","https://openalex.org/W6810334672","https://openalex.org/W6810940779","https://openalex.org/W6811013733","https://openalex.org/W6853219534","https://openalex.org/W6853702739","https://openalex.org/W6861125885"],"related_works":["https://openalex.org/W4390516098","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2142795561","https://openalex.org/W4205302943","https://openalex.org/W2561132942","https://openalex.org/W3155418658","https://openalex.org/W4243199227","https://openalex.org/W2005234362","https://openalex.org/W1997235926"],"abstract_inverted_index":{"Large":[0],"pre-trained":[1,73],"vision-language":[2],"models,":[3],"such":[4],"as":[5],"CLIP":[6,23,155],"[1],":[7],"have":[8,34],"demonstrated":[9],"remarkable":[10],"performance":[11],"in":[12,24,79],"few":[13],"shot":[14],"image":[15,43,108,129,160,171,196,205,243],"classification.":[16,161],"To":[17],"facilitate":[18],"the":[19,42,52,72,88,105,118,124,128,138,165,193,199,204,218,223,227,252,267,270],"rapid":[20],"adaptation":[21],"of":[22,120,167,195,269],"downstream":[25],"tasks":[26],"with":[27,222],"limited":[28,67],"visual":[29,49,68,74,142,210,237],"samples,":[30],"two":[31],"primary":[32],"frameworks":[33],"been":[35],"proposed.":[36],"The":[37,82],"first":[38],"framework":[39,63,84,116],"centers":[40],"on":[41,66,104,261],"encoder":[44,90],"and":[45,97,110,130,172,179,187,235,244],"introduces":[46],"a":[47,147,177],"trainable":[48,93],"classifier":[50,178,214],"after":[51],"backbone":[53],"to":[54,86,136,207,230,256],"generate":[55],"logits":[56,99],"for":[57,100,154,159,213],"each":[58,101],"object":[59],"class.":[60],"Nevertheless,":[61],"this":[62,115],"heavily":[64],"depends":[65],"features":[69,109],"extracted":[70,126],"by":[71,91,127],"encoder,":[75,206,229],"which":[76],"can":[77,163],"result":[78],"over-fitting":[80],"issues.":[81],"second":[83],"aims":[85],"optimize":[87],"text":[89,131,173,228,245],"using":[92,141,183],"soft":[94],"language":[95,139],"prompts":[96,140],"computing":[98],"class":[102],"based":[103,156],"similarity":[106],"between":[107,123],"optimized":[111],"prompt":[112,220],"features.":[113,174],"However,":[114],"encounters":[117],"issue":[119],"imperfect":[121],"alignment":[122],"representations":[125,197],"encoders,":[132],"making":[133],"it":[134],"difficult":[135],"fine-tune":[137],"samples.":[143],"This":[144],"paper":[145],"proposes":[146],"Multi-":[148],"Modal":[149],"Prototype":[150],"Regularization":[151],"(MMPR)":[152],"method":[153,273],"few-shot":[157],"fine-tuning":[158],"MMPR":[162,175,239,272],"address":[164],"challenges":[166],"effectively":[168],"utilizing":[169],"both":[170,184,242],"fine-tunes":[176],"regularizes":[180],"its":[181],"weights":[182],"image-based":[185],"(ImgPR)":[186],"text-based":[188],"(TexPR)":[189],"prototypes.":[190],"ImgPR":[191],"represents":[192,217],"mean":[194],"within":[198],"same":[200],"class,":[201,224],"derived":[202,225],"from":[203,226],"distill":[208],"specific":[209],"distribution":[211],"knowledge":[212,234],"adaptation.":[215],"TexPR":[216],"hand-crafted":[219],"associated":[221],"incorporate":[231],"general":[232],"encyclopedic":[233],"mitigate":[236],"over-fitting.":[238],"significantly":[240],"leverages":[241],"information":[246],"without":[247],"increasing":[248],"computational":[249],"complexity":[250],"during":[251],"inference":[253],"stage":[254],"compared":[255],"existing":[257],"methods.":[258,276],"Experimental":[259],"results":[260],"various":[262],"challenging":[263],"public":[264],"benchmarks":[265],"demonstrate":[266],"superiority":[268],"proposed":[271],"over":[274],"state-of-the-art":[275]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":7}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
