{"id":"https://openalex.org/W4386523254","doi":"https://doi.org/10.1109/tmm.2023.3311646","title":"SgVA-CLIP: Semantic-Guided Visual Adapting of Vision-Language Models for Few-Shot Image Classification","display_name":"SgVA-CLIP: Semantic-Guided Visual Adapting of Vision-Language Models for Few-Shot Image Classification","publication_year":2023,"publication_date":"2023-09-07","ids":{"openalex":"https://openalex.org/W4386523254","doi":"https://doi.org/10.1109/tmm.2023.3311646"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2023.3311646","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3311646","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101801577","display_name":"Fang Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fang Peng","raw_affiliation_strings":["State Key Laboratory of Multimodal Artificial Intelligence Systems (MAIS), Institute of Automation, Chinese Academy of Sciences, Beijing, China","Peng Cheng Laboratory, Shenzhen, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3948-7413","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimodal Artificial Intelligence Systems (MAIS), Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083991825","display_name":"Xiaoshan Yang","orcid":"https://orcid.org/0000-0001-5453-9755"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoshan Yang","raw_affiliation_strings":["State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-5453-9755","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100680501","display_name":"Linhui Xiao","orcid":"https://orcid.org/0000-0003-2592-5264"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linhui Xiao","raw_affiliation_strings":["State Key Laboratory of Multimodal Artificial Intelligence Systems (MAIS), Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-2592-5264","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimodal Artificial Intelligence Systems (MAIS), Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100631216","display_name":"Yaowei Wang","orcid":"https://orcid.org/0000-0003-2197-9038"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaowei Wang","raw_affiliation_strings":["Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-2197-9038","affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022636178","display_name":"Changsheng Xu","orcid":"https://orcid.org/0000-0001-8343-9665"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changsheng Xu","raw_affiliation_strings":["State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","Peng Cheng Laboratory, Shenzhen, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8343-9665","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101801577"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210094879","https://openalex.org/I4210100255","https://openalex.org/I4210136793","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":12.1524,"has_fulltext":false,"cited_by_count":72,"citation_normalized_percentile":{"value":0.99031132,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"26","issue":null,"first_page":"3469","last_page":"3480"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.9645000100135803,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8754785060882568},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7321624755859375},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.591905951499939},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.48741844296455383},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.48382845520973206},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.46290668845176697},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.4340501129627228},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38804900646209717},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2512878179550171}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8754785060882568},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7321624755859375},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.591905951499939},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48741844296455383},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.48382845520973206},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46290668845176697},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.4340501129627228},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38804900646209717},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2512878179550171}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2023.3311646","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3311646","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1100260481","display_name":null,"funder_award_id":"62072455","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1498893086","display_name":null,"funder_award_id":"62036012","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6544960559","display_name":null,"funder_award_id":"62322212","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":67,"referenced_works":["https://openalex.org/W12634471","https://openalex.org/W24089286","https://openalex.org/W1821462560","https://openalex.org/W1846799578","https://openalex.org/W1977295328","https://openalex.org/W2017814585","https://openalex.org/W2047643928","https://openalex.org/W2108598243","https://openalex.org/W2117539524","https://openalex.org/W2138011018","https://openalex.org/W2155893237","https://openalex.org/W2155904486","https://openalex.org/W2294370754","https://openalex.org/W2533598788","https://openalex.org/W2963943197","https://openalex.org/W2964194231","https://openalex.org/W2978017171","https://openalex.org/W2985353426","https://openalex.org/W3010597097","https://openalex.org/W3012209922","https://openalex.org/W3097414768","https://openalex.org/W3105966348","https://openalex.org/W3120387732","https://openalex.org/W3128632573","https://openalex.org/W3139732141","https://openalex.org/W3163842339","https://openalex.org/W3198377975","https://openalex.org/W3198675127","https://openalex.org/W3204699193","https://openalex.org/W3205976355","https://openalex.org/W3215626407","https://openalex.org/W4200374933","https://openalex.org/W4205277845","https://openalex.org/W4206077751","https://openalex.org/W4213303451","https://openalex.org/W4221141660","https://openalex.org/W4224545477","https://openalex.org/W4226255121","https://openalex.org/W4283517970","https://openalex.org/W4285288414","https://openalex.org/W4307074156","https://openalex.org/W4312310776","https://openalex.org/W4312359569","https://openalex.org/W4312589581","https://openalex.org/W4312622641","https://openalex.org/W4313156423","https://openalex.org/W4313175608","https://openalex.org/W4313196086","https://openalex.org/W4315631108","https://openalex.org/W4386790226","https://openalex.org/W4390873714","https://openalex.org/W6600983433","https://openalex.org/W6638523607","https://openalex.org/W6638677478","https://openalex.org/W6717697761","https://openalex.org/W6748284727","https://openalex.org/W6759807521","https://openalex.org/W6763315676","https://openalex.org/W6768851824","https://openalex.org/W6775093496","https://openalex.org/W6790019176","https://openalex.org/W6791353385","https://openalex.org/W6803872405","https://openalex.org/W6809591836","https://openalex.org/W6810154958","https://openalex.org/W6839394562","https://openalex.org/W6846189718"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W1487808658","https://openalex.org/W2761785940","https://openalex.org/W2129933262","https://openalex.org/W2005234362","https://openalex.org/W1997235926"],"abstract_inverted_index":{"Although":[0],"significant":[1],"progress":[2],"has":[3],"been":[4,44],"made":[5],"in":[6,33,48],"few-shot":[7,12,49,180],"learning,":[8],"most":[9],"of":[10,23,25,157],"existing":[11],"image":[13,181],"classification":[14],"methods":[15],"require":[16],"supervised":[17],"pre-training":[18],"on":[19,67,163],"a":[20,55,104,132,137],"large":[21],"amount":[22],"samples":[24],"base":[26],"classes,":[27],"which":[28,112],"limits":[29],"their":[30],"generalization":[31],"ability":[32],"real":[34],"world":[35],"application.":[36],"Recently,":[37],"large-scale":[38],"Vision-Language":[39],"Pre-trained":[40],"models":[41,118],"(VLPs)":[42],"have":[43],"gaining":[45],"increasing":[46],"attention":[47],"learning":[50,62,89],"because":[51],"they":[52],"can":[53,113,172],"provide":[54],"new":[56,105],"paradigm":[57],"for":[58,88],"transferable":[59],"visual":[60,76,123,170],"representation":[61],"with":[63],"easily":[64],"available":[65],"text":[66],"the":[68,71,99,149,155,158,168,175],"Web.":[69],"However,":[70],"VLPs":[72],"may":[73],"neglect":[74],"detailed":[75],"information":[77],"that":[78,167],"is":[79,145],"difficult":[80],"to":[81,93,119,147,153,178],"describe":[82],"by":[83,125],"language":[84],"sentences,":[85],"but":[86],"important":[87],"an":[90,128],"effective":[91],"classifier":[92],"distinguish":[94],"different":[95],"images.":[96],"To":[97],"address":[98],"above":[100],"problem,":[101],"we":[102],"propose":[103],"framework,":[106],"named":[107],"Semantic-guided":[108],"Visual":[109],"Adapting":[110],"(SgVA),":[111],"effectively":[114],"extend":[115],"vision-language":[116],"pre-trained":[117],"produce":[120],"discriminative":[121],"adapted":[122,169],"features":[124,171,177],"comprehensively":[126],"using":[127],"implicit":[129,142],"knowledge":[130,143,152],"distillation,":[131],"vision-specific":[133],"contrastive":[134,139],"loss,":[135],"and":[136],"cross-modal":[138,151,176],"loss.":[140],"The":[141],"distillation":[144],"designed":[146],"transfer":[148],"fine-grained":[150],"guide":[154],"updating":[156],"vision":[159],"adapter.":[160],"State-of-the-art":[161],"results":[162],"13":[164],"datasets":[165],"demonstrate":[166],"well":[173],"complement":[174],"improve":[179],"classification.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":12},{"year":2025,"cited_by_count":33},{"year":2024,"cited_by_count":23},{"year":2023,"cited_by_count":4}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
