{"id":"https://openalex.org/W4413887381","doi":"https://doi.org/10.1109/tpami.2025.3604454","title":"Structure-Induced Gradient Regulation for Generalizable Vision-Language Models","display_name":"Structure-Induced Gradient Regulation for Generalizable Vision-Language Models","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W4413887381","doi":"https://doi.org/10.1109/tpami.2025.3604454","pmid":"https://pubmed.ncbi.nlm.nih.gov/40889308"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3604454","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3604454","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015420479","display_name":"Juncheng Li","orcid":"https://orcid.org/0000-0003-2258-1291"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Juncheng Li","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-2258-1291","affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061203331","display_name":"Minghe Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minghe Gao","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0000-9705-5398","affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063062444","display_name":"Siliang Tang","orcid":"https://orcid.org/0000-0002-7356-9711"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siliang Tang","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-7356-9711","affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050660610","display_name":"Longhui Wei","orcid":"https://orcid.org/0000-0001-6916-3009"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Longhui Wei","raw_affiliation_strings":["Huawei, Shanghai, China","Huawei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Huawei, Shanghai, China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Huawei, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101485989","display_name":"Jun Xiao","orcid":"https://orcid.org/0000-0002-6142-9914"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Xiao","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-6142-9914","affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004882141","display_name":"Fei Wu","orcid":"https://orcid.org/0000-0003-2139-8807"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Wu","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-2139-8807","affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051332325","display_name":"Richang Hong","orcid":"https://orcid.org/0000-0001-5461-3986"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Richang Hong","raw_affiliation_strings":["Hefei University of Technology, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0001-5461-3986","affiliations":[{"raw_affiliation_string":"Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100377147","display_name":"Meng Wang","orcid":"https://orcid.org/0000-0002-3094-7735"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Wang","raw_affiliation_strings":["Hefei University of Technology, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-3094-7735","affiliations":[{"raw_affiliation_string":"Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100393506","display_name":"Qi Tian","orcid":"https://orcid.org/0000-0002-7252-5047"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Tian","raw_affiliation_strings":["Huawei, Shanghai, China","Huawei, China"],"raw_orcid":"https://orcid.org/0000-0002-7252-5047","affiliations":[{"raw_affiliation_string":"Huawei, Shanghai, China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Huawei, China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5015420479"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.20707965,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"48","issue":"1","first_page":"219","last_page":"235"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.973800003528595,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.973800003528595,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6596612930297852},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6483461260795593},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.49940037727355957},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.37702468037605286},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32404547929763794}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6596612930297852},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6483461260795593},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.49940037727355957},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.37702468037605286},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32404547929763794}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3604454","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3604454","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:40889308","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40889308","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5102038799","display_name":null,"funder_award_id":"62441617","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6689777572","display_name":null,"funder_award_id":"226-2025-00057","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W12634471","https://openalex.org/W1861492603","https://openalex.org/W1933349210","https://openalex.org/W1977295328","https://openalex.org/W2017814585","https://openalex.org/W2047643928","https://openalex.org/W2108598243","https://openalex.org/W2137825550","https://openalex.org/W2138011018","https://openalex.org/W2155904486","https://openalex.org/W2533598788","https://openalex.org/W2601243251","https://openalex.org/W2886641317","https://openalex.org/W2889326414","https://openalex.org/W2963043696","https://openalex.org/W2964105864","https://openalex.org/W2964194231","https://openalex.org/W2970641574","https://openalex.org/W3034549794","https://openalex.org/W3037492894","https://openalex.org/W3176641147","https://openalex.org/W3177096435","https://openalex.org/W3198377975","https://openalex.org/W4200635486","https://openalex.org/W4205991051","https://openalex.org/W4281487830","https://openalex.org/W4312310776","https://openalex.org/W4312651322","https://openalex.org/W4386076413","https://openalex.org/W4390873714","https://openalex.org/W4390873802","https://openalex.org/W4393155041","https://openalex.org/W4402726965","https://openalex.org/W4413146627"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407"],"abstract_inverted_index":{"Prompt":[0],"tuning,":[1],"a":[2,65,84,94,109,120,132,149,162,226],"recently":[3],"emerging":[4],"paradigm,":[5],"adapts":[6],"vision-language":[7],"pre-trained":[8],"models":[9],"to":[10,31,53,184,205],"new":[11],"tasks":[12,234],"efficiently":[13],"by":[14,29],"learning":[15,69],"\"soft":[16],"prompts\"":[17],"for":[18,38,80,89,157,193,230],"frozen":[19],"models.":[20],"However,":[21],"in":[22,93,148],"few-shot":[23],"scenarios,":[24],"its":[25],"effectiveness":[26],"is":[27,106],"limited":[28],"sensitivity":[30],"the":[32,35,49,99,186,190,200,215,241,253],"initialization":[33,79],"and":[34,83,152,176,211,235,256],"time-consuming":[36],"search":[37],"optimal":[39],"initialization,":[40],"hindering":[41],"rapid":[42],"adaptation.":[43],"Additionally,":[44],"prompt":[45,78,134,145,169],"tuning":[46,135,146,170],"risks":[47],"reducing":[48],"models'":[50],"generalizability":[51,92,258],"due":[52],"overfitting":[54],"on":[55],"scarce":[56],"training":[57],"samples.":[58],"To":[59],"overcome":[60],"these":[61],"challenges,":[62],"we":[63,160,224],"introduce":[64,225],"novel":[66,197],"Gradient-RegulAted":[67],"Meta-prompt":[68],"(GRAM)":[70],"framework":[71],"that":[72,114],"jointly":[73],"meta-learns":[74],"an":[75,178],"efficient":[76],"soft":[77],"better":[81],"adaptation":[82],"lightweight":[85],"gradient":[86,181],"regulating":[87,182],"function":[88,183],"strong":[90],"cross-domain":[91],"meta-learning":[95,125,191,203,212],"paradigm":[96],"using":[97],"only":[98,172],"weakly":[100],"labeled":[101],"image-text":[102,117],"pre-training":[103],"data.":[104],"This":[105,196],"achieved":[107],"through":[108],"Cross-Modal":[110],"Hierarchical":[111],"Clustering":[112],"algorithm":[113],"organizes":[115],"extensive":[116],"data":[118,192,204,210],"into":[119,143],"structured":[121,187],"hierarchy,":[122],"facilitating":[123,214],"robust":[124],"across":[126],"diverse":[127,242],"domains.":[128],"Rather":[129],"than":[130],"designing":[131],"specific":[133],"method,":[136],"our":[137,260],"GRAM":[138],"can":[139],"be":[140],"easily":[141],"incorporated":[142],"various":[144],"methods":[147],"model-agnostic":[150],"way":[151],"bring":[153],"about":[154],"consistent":[155],"improvement":[156],"them.":[158],"Further,":[159],"consider":[161],"more":[163],"practical":[164],"but":[165],"challenging":[166],"setting:":[167],"test-time":[168,209],"with":[171],"unlabeled":[173],"test":[174],"samples":[175],"propose":[177],"improved":[179],"structure-induced":[180],"leverage":[185],"semantics":[188,243],"of":[189,217,247,259],"zero-shot":[194,257],"generalization.":[195],"approach":[198],"exploits":[199],"hierarchically":[201],"clustered":[202],"model":[206],"relationships":[207],"between":[208],"prototypes,":[213,237],"transfer":[216],"invariant":[218],"knowledge":[219],"without":[220],"explicit":[221],"annotations.":[222],"Meanwhile,":[223],"structure":[227],"complexity-informed":[228],"strategy":[229],"adaptively":[231],"constructing":[232],"meta-training":[233],"generating":[236],"which":[238],"fully":[239],"considers":[240],"within":[244],"hierarchical":[245],"clusters":[246],"different":[248],"complexities.":[249],"Comprehensive":[250],"experiments":[251],"demonstrate":[252],"state-of-the-art":[254],"few-":[255],"method.":[261]},"counts_by_year":[],"updated_date":"2025-12-04T23:47:47.292601","created_date":"2025-10-10T00:00:00"}
